Notifications: You must be signed in to change notification settings
Fork 11.9k
Star 31k

Commit f59a423

authored

Merge pull request #10536 from eric-wieser/fix-10394

BUG: Resize bytes_ columns in genfromtxt (backport of #10401)

2 parents 54abb9a + 0a87861, commit f59a423 (Copy full SHA for f59a423)

File tree

2 files changed

+27

-17

lines changed

numpy/lib
- npyio.py
- tests
  - test_io.py

2 files changed

+27

-17

lines changed

`‎numpy/lib/npyio.py‎`

Lines changed: 20 additions & 17 deletions

Original file line number	Diff line number	Diff line change
`@@ -2042,7 +2042,6 @@ def tobytes_first(x, conv):`
`2042`	`2042`	`strcolidx= [ifor (i,v)inenumerate(column_types)`
`2043`	`2043`	`ifv==np.unicode_]`
`2044`	`2044`
`2045`		`-type_str=np.unicode_`
`2046`	`2045`	`ifbyte_convertersandstrcolidx:`
`2047`	`2046`	`# convert strings back to bytes for backward compatibility`
`2048`	`2047`	`warnings.warn(`
`@@ -2058,33 +2057,37 @@ def encode_unicode_cols(row_tup):`
`2058`	`2057`
`2059`	`2058`	`try:`
`2060`	`2059`	`data= [encode_unicode_cols(r)forrindata]`
`2061`		`-type_str=np.bytes_`
`2062`	`2060`	`exceptUnicodeEncodeError:`
`2063`	`2061`	`pass`
	`2062`	`+else:`
	`2063`	`+foriinstrcolidx:`
	`2064`	`+column_types[i]=np.bytes_`
`2064`	`2065`
	`2066`	`+# Update string types to be the right length`
	`2067`	`+sized_column_types=column_types[:]`
	`2068`	`+fori,col_typeinenumerate(column_types):`
	`2069`	`+ifnp.issubdtype(col_type,np.character):`
	`2070`	`+n_chars=max(len(row[i])forrowindata)`
	`2071`	`+sized_column_types[i]= (col_type,n_chars)`
`2065`	`2072`
`2066`		`-# ... and take the largest number of chars.`
`2067`		`-foriinstrcolidx:`
`2068`		`-max_line_length=max(len(row[i])forrowindata)`
`2069`		`-column_types[i]=np.dtype((type_str,max_line_length))`
`2070`		`-#`
`2071`	`2073`	`ifnamesisNone:`
`2072`		`-# If the dtype is uniform, don't define names, else use ''`
`2073`		`-base=set([c.typeforcinconvertersifc._checked])`
	`2074`	`+# If the dtype is uniform (before sizing strings)`
	`2075`	`+base=set([`
	`2076`	`+c_type`
	`2077`	`+forc,c_typeinzip(converters,column_types)`
	`2078`	`+ifc._checked])`
`2074`	`2079`	`iflen(base)==1:`
`2075`		`-ifstrcolidx:`
`2076`		`- (ddtype,mdtype)= (type_str,bool)`
`2077`		`-else:`
`2078`		`- (ddtype,mdtype)= (list(base)[0],bool)`
	`2080`	`+uniform_type,=base`
	`2081`	`+ (ddtype,mdtype)= (uniform_type,bool)`
`2079`	`2082`	`else:`
`2080`	`2083`	`ddtype= [(defaultfmt%i,dt)`
`2081`		`-for (i,dt)inenumerate(column_types)]`
	`2084`	`+for (i,dt)inenumerate(sized_column_types)]`
`2082`	`2085`	`ifusemask:`
`2083`	`2086`	`mdtype= [(defaultfmt%i,bool)`
`2084`		`-for (i,dt)inenumerate(column_types)]`
	`2087`	`+for (i,dt)inenumerate(sized_column_types)]`
`2085`	`2088`	`else:`
`2086`		`-ddtype=list(zip(names,column_types))`
`2087`		`-mdtype=list(zip(names, [bool]*len(column_types)))`
	`2089`	`+ddtype=list(zip(names,sized_column_types))`
	`2090`	`+mdtype=list(zip(names, [bool]*len(sized_column_types)))`
`2088`	`2091`	`output=np.array(data,dtype=ddtype)`
`2089`	`2092`	`ifusemask:`
`2090`	`2093`	`outputmask=np.array(masks,dtype=mdtype)`

`‎numpy/lib/tests/test_io.py‎`

Lines changed: 7 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -2056,6 +2056,13 @@ def test_recfromcsv(self):`
`2056`	`2056`	`assert_(isinstance(test,np.recarray))`
`2057`	`2057`	`assert_equal(test,control)`
`2058`	`2058`
	`2059`	`+#gh-10394`
	`2060`	`+data=TextIO('color\n"red"\n"blue"')`
	`2061`	`+test=np.recfromcsv(data,converters={0:lambdax:x.strip(b'\"')})`
	`2062`	`+control=np.array([('red',), ('blue',)],dtype=[('color', (bytes,4))])`
	`2063`	`+assert_equal(test.dtype,control.dtype)`
	`2064`	`+assert_equal(test,control)`
	`2065`	`+`
`2059`	`2066`	`deftest_max_rows(self):`
`2060`	`2067`	# Test the `max_rows` keyword argument.
`2061`	`2068`	`data='1 2\n3 4\n5 6\n7 8\n9 10\n'`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

Commit f59a423

File tree

2 files changed

2 files changed

`‎numpy/lib/npyio.py‎`

`‎numpy/lib/tests/test_io.py‎`

0 commit comments