From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Date: Sun, 18 Nov 2007 03:41:13 +0300 From: Alexey Tourbin To: ALT Devel discussion list Message-ID: <20071118004113.GE4801@solemn.turbinal> Mail-Followup-To: ALT Devel discussion list References: <473E0BD7.9080704@altlinux.com> <20071117050109.GJ31452@solemn.turbinal> <473E9A73.2000300@altlinux.com> Mime-Version: 1.0 Content-Type: multipart/signed; micalg=pgp-sha1; protocol="application/pgp-signature"; boundary="BZaMRJmqxGScZ8Mx" Content-Disposition: inline In-Reply-To: <473E9A73.2000300@altlinux.com> Subject: Re: [devel] python encodings X-BeenThere: devel@lists.altlinux.org X-Mailman-Version: 2.1.9 Precedence: list Reply-To: ALT Linux Team development discussions List-Id: ALT Linux Team development discussions List-Unsubscribe: , List-Archive: List-Post: List-Help: List-Subscribe: , X-List-Received-Date: Sun, 18 Nov 2007 00:41:20 -0000 Archived-At: List-Archive: List-Post: --BZaMRJmqxGScZ8Mx Content-Type: text/plain; charset=koi8-r Content-Disposition: inline Content-Transfer-Encoding: quoted-printable On Sat, Nov 17, 2007 at 10:38:27AM +0300, Anton Farygin wrote: > =ED=CE=C5 =CB=C1=D6=C5=D4=D3=D1, =DE=D4=CF =C4=CF=D3=D4=C1=D4=CF=DE=CE=CF= =C2=D9=CC=CF =C2=D9 =D7=D9=D7=C5=D3=D4=C9 =D7=CD=C5=CE=D1=C5=CD=D5=C0 =C4= =C9=C1=C7=CE=CF=D3=D4=C9=CB=D5. =F0=CF=20 > =CB=D2=C1=CA=CE=C5=CA =CD=C5=D2=C5 =D7 =CD=CF=A3=CD =D3=CC=D5=DE=C1=C5. =F1 =D3=C4=C5=CC=C1=CC =D7=CD=C5=CE=D1=C5=CD=D5=C0 =C4=C9=C1=C7=CE=CF=D3=D4= =C9=CB=D5, =CE=C1=D3=CB=CF=CC=D8=CB=CF =DC=D4=CF =D7=CF=DA=CD=CF=D6=CE=CF. $ hsh --init =2E. rpm-build-python-0.32-alt1 =2E.. $ hsh-shell $$ cd $$ echo '# coding: utf8' >test.py $$ /usr/lib/rpm/python.req test.py python.req: test.py: non-standard encoding: utf8 python2.4(encodings) python.req: ERROR: test.py:=20 python.req: maybe you need python-modules-encodings Traceback (most recent call last): File "/usr/lib/rpm/python.req.py", line 178, in ? 
import encodings ImportError: No module named encodings $$=20 =F7=CF=CF=C2=DD=C5-=D4=CF MemoryError =D7 =C4=C1=CE=CE=CF=CD =D3=CC=D5=DE= =C1=C5 -- =DC=D4=CF =D0=C9=D4=CF=CE=CF=D7=D3=CB=C9=CA =C2=C1=C7 http://bugs.python.org/issue979739 > > =E4=D5=CD=C1=C0, =DA=C1=C8=C1=DE=C9=D4=D8 =CE=C1 =DC=D4=D5 =D4=C5=CD=D5= python-base =C9=CC=C9 =CE=C5=D4. =F4=CF =C5=D3=D4=D8 =DE=D4=CF=C2=D9 =CF= =CE > > =D0=CF=CE=C9=CD=C1=CC =D0=CF=C2=CF=CC=D8=DB=C5 =CE=C1=D3=D4=C1=CE=C4=C1= =D2=D4=CE=D9=C8 =C1=CC=C9=C1=D3=CF=D7 =C4=CC=D1 =D3=D4=C1=CE=C4=C1=D2=D4=CE= =D9=C8 =CB=CF=C4=C9=D2=CF=D7=CF=CB, > > =C2=C5=DA =DA=C1=C7=CC=D1=C4=D9=D7=C1=CE=C9=D1 =D7 encodings. >=20 > =E5=D3=CC=C9 =CE=C5=D3=D4=C1=CE=D4=C1=D2=D4=CE=D9=C5 =C1=CC=C9=C1=D3=D9 = =D1=D7=CC=D1=C0=D4=D3=D1 =D3=D4=C1=CE=C4=C1=D2=D4=CF=CD =C4=C5-=C6=C1=CB=D4= =CF (=D4.=C5. -=20 > =DA=CE=C1=DE=C9=D4=C5=CC=D8=CE=CF =D2=C1=D3=D0=D2=CF=D3=D4=D2=C1=CE=C5=CE= =D9), =D4=CF =D7=C9=C4=C9=CD=CF =D3=D4=CF=C9=D4 =C8=C1=DE=C9=D4=D8 =D0=C9= =D4=CF=CE. =F7 =CF=C2=D2=C1=D4=CE=CF=CD=20 > =D3=CC=D5=DE=C1=C1=C5 - =D7=D9=D7=CF=C4=C9=D4=D8 =D7=CD=C5=CE=D1=C5=CD=D5= =C0 =C4=C9=C1=C7=CE=CF=D3=D4=C9=CB=D5 =C9 =D0=C1=D4=DE=C9=D4=D8 =D0=D2=C9= =CC=CF=D6=C5=CE=C9=D1. =F0=CF=D3=CD=CF=D4=D2=C9=CD, =CE=C1=D3=CB=CF=CC=D8=CB=CF =CF=CE=C9 =D2=C1= =D3=D0=D2=CF=D3=D4=D2=C1=CE=C5=CE=D9. 
Parser/tokenizer.c: 183 static char * 184 get_normal_name(char *s) /* for utf-8 and latin-1 */ 185 { 186 char buf[13]; 187 int i; 188 for (i =3D 0; i < 12; i++) { 189 int c =3D s[i]; 190 if (c =3D=3D '\0') break; 191 else if (c =3D=3D '_') buf[i] =3D '-'; 192 else buf[i] =3D tolower(c); 193 } 194 buf[i] =3D '\0'; 195 if (i > 3) { /* at least 4 characters */ 196 const char *p =3D NULL; 197 switch (buf[0]) { 198 case 'u': 199 if (strncmp(buf, "utf-8", 5) =3D=3D 0) 200 p =3D buf + 5; 201 else if (strncmp(buf, "utf8", 4) =3D=3D 0) 202 p =3D buf + 4; 203 if (p && (*p =3D=3D '\0' || *p =3D=3D '-')) 204 return "utf-8"; 205 break; 206 case 'i': 207 if (strncmp(buf, "utf-8") =3D=3D 0) 208 p =3D buf + 5; 209 =20 210 =20 211 =20 212 if (strcmp(buf, "utf-8") =3D=3D 0 || 213 strncmp(buf, "utf-8-", 6) =3D=3D 0) return "utf-8"; 214 else if (strcmp(buf, "latin-1") =3D=3D 0 || 215 strcmp(buf, "iso-8859-1") =3D=3D 0 || 216 strcmp(buf, "iso-latin-1") =3D=3D 0 || 217 strncmp(buf, "latin-1-", 8) =3D=3D 0 || 218 strncmp(buf, "iso-8859-1-", 11) =3D=3D 0 || 219 strncmp(buf, "iso-latin-1-", 12) =3D=3D 0) return = "iso-8859-1"; 220 else return s;gg 221 } =F4=CF =C5=D3=D4=D8 =D5 =D0=C9=D4=CF=CE=C1 =C5=D3=D4=D8 =C4=D7=C5 =D3=D4=C1= =CE=C4=C1=D2=D4=CE=D9=C5 =CB=CF=C4=C9=D2=CF=D7=CB=C9, =C4=CC=D1 =CB=CF=D4= =CF=D2=D9=C8 =D0=CF=DE=D4=C9 =CE=C9=DE=C5=C7=CF =CE=C5 =CE=D5=D6=CE=CF -- utf-8 =C9 iso-8859-1. =EE=CF = =D7 =CD=CF=C4=D5=CC=C5 encodings =CF=D0=D2=C5=C4=C5=CC=D1=C0=D4=D3=D1 =C4=CF=D0=CF=CC=CE=C9=D4=C5=CC=D8=CE= =D9=C5 =C1=CC=C9=C1=D3=D9, =D7 =D4=CF=CD =DE=C9=D3=CC=C5 =C4=CC=D1 =D3=D4= =C1=CE=C4=C1=D2=D4=CE=D9=C8 =CB=CF=C4=C9=D2=CF=D7=CF=CB. Lib/encodings/aliases.py: 395 # latin_1 codec 396 '8859' : 'latin_1', 397 'cp819' : 'latin_1', 398 'csisolatin1' : 'latin_1', 399 'ibm819' : 'latin_1', 400 'iso8859' : 'latin_1', 401 'iso_8859_1' : 'latin_1', 402 'iso_8859_1_1987' : 'latin_1', 403 'iso_ir_100' : 'latin_1', 404 'l1' : 'latin_1', 405 'latin' : 'latin_1', 406 'latin1' : 'latin_1', =2E.. 
486 # utf_8 codec 487 'u8' : 'utf_8', 488 'utf' : 'utf_8', 489 'utf8' : 'utf_8', 490 'utf8_ucs2' : 'utf_8', 491 'utf8_ucs4' : 'utf_8', =E5=D3=D4=D8 =C9=D3=CB=D5=DB=C5=CE=C9=C5 =D7=CE=C5=D3=D4=C9 =CE=C5=CB=CF=D4= =CF=D2=D9=C5 =C9=DA =DC=D4=C9=C8 =C1=CC=C9=C1=D3=CF=D7 =D7 Parser/tokenizer.c, =DE=D4=CF=C2=D9 =D5=CD=C5=CE=D8=DB=C9=D4=D8 =DE=C9=D3=CC=CF =D0=C1=C4=C5=CE= =C9=CA =D0=D2=C9 =CF=D4=D3=D5=D4=D3=D4=D7=C9=C9 encodings/aliases.py. =F0=CF=D3=CD=CF=D4=D2=C9=CD, =DE=D4=CF =C2=D5=C4=C5=D4 =D0=CF =D2=C5=DA=D5= =CC=D8=D4=C1=D4=C1=CD =D0=C5=D2=C5=D3=C2=CF=D2=CB=C9 =D3 =CE=CF=D7=D9=CD rp= m-build-python. =F0=CF=D4=CF=CD=D5 =DE=D4=CF =D4=C5=D0=C5=D2=D8 =D7 python.req.py =C2=D5=C4= =C5=D4 =C4=C9=C1=C7=CE=CF=D3=D4=C9=CB=C1 "non-standard encoding:", =CB=CF=D4=CF=D2=C1=D1 =CD=C9=CD=C9=CB=D2=C9=D2=D5=C5=D4 =D0=D2=CF=D7=C5=D2= =CB=D5 =D7 Parser/tokenizer.c. --BZaMRJmqxGScZ8Mx Content-Type: application/pgp-signature Content-Disposition: inline -----BEGIN PGP SIGNATURE----- Version: GnuPG v1.4.7 (GNU/Linux) iD8DBQFHP4opfBKgtDjnu0YRAoYDAJ46HF314CLUW8YVMGlvhB+zvcqo4wCgvIxV MPFoa8WUUrWB9ZKqjp/FLoU= =qVPK -----END PGP SIGNATURE----- --BZaMRJmqxGScZ8Mx--