@@ -250,117 +250,3 @@ def test_na_values_keep_default(self):
250
250
'Three' : ['None' , 'two' , 'None' , 'nan' , 'five' , '' ,
251
251
'seven' ]})
252
252
tm .assert_frame_equal (xp .reindex (columns = df .columns ), df )
253
-
254
- def test_skiprow_with_newline (self ):
255
- # see gh-12775 and gh-10911
256
- data = """id,text,num_lines
257
- 1,"line 11
258
- line 12",2
259
- 2,"line 21
260
- line 22",2
261
- 3,"line 31",1"""
262
- expected = [[2 , 'line 21\n line 22' , 2 ],
263
- [3 , 'line 31' , 1 ]]
264
- expected = DataFrame (expected , columns = [
265
- 'id' , 'text' , 'num_lines' ])
266
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
267
- tm .assert_frame_equal (df , expected )
268
-
269
- data = ('a,b,c\n ~a\n b~,~e\n d~,'
270
- '~f\n f~\n 1,2,~12\n 13\n 14~' )
271
- expected = [['a\n b' , 'e\n d' , 'f\n f' ]]
272
- expected = DataFrame (expected , columns = [
273
- 'a' , 'b' , 'c' ])
274
- df = self .read_csv (StringIO (data ),
275
- quotechar = "~" ,
276
- skiprows = [2 ])
277
- tm .assert_frame_equal (df , expected )
278
-
279
- data = ('Text,url\n ~example\n '
280
- 'sentence\n one~,url1\n ~'
281
- 'example\n sentence\n two~,url2\n ~'
282
- 'example\n sentence\n three~,url3' )
283
- expected = [['example\n sentence\n two' , 'url2' ]]
284
- expected = DataFrame (expected , columns = [
285
- 'Text' , 'url' ])
286
- df = self .read_csv (StringIO (data ),
287
- quotechar = "~" ,
288
- skiprows = [1 , 3 ])
289
- tm .assert_frame_equal (df , expected )
290
-
291
- def test_skiprow_with_quote (self ):
292
- # see gh-12775 and gh-10911
293
- data = """id,text,num_lines
294
- 1,"line '11' line 12",2
295
- 2,"line '21' line 22",2
296
- 3,"line '31' line 32",1"""
297
- expected = [[2 , "line '21' line 22" , 2 ],
298
- [3 , "line '31' line 32" , 1 ]]
299
- expected = DataFrame (expected , columns = [
300
- 'id' , 'text' , 'num_lines' ])
301
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
302
- tm .assert_frame_equal (df , expected )
303
-
304
- def test_skiprow_with_newline_and_quote (self ):
305
- # see gh-12775 and gh-10911
306
- data = """id,text,num_lines
307
- 1,"line \n '11' line 12",2
308
- 2,"line \n '21' line 22",2
309
- 3,"line \n '31' line 32",1"""
310
- expected = [[2 , "line \n '21' line 22" , 2 ],
311
- [3 , "line \n '31' line 32" , 1 ]]
312
- expected = DataFrame (expected , columns = [
313
- 'id' , 'text' , 'num_lines' ])
314
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
315
- tm .assert_frame_equal (df , expected )
316
-
317
- data = """id,text,num_lines
318
- 1,"line '11\n ' line 12",2
319
- 2,"line '21\n ' line 22",2
320
- 3,"line '31\n ' line 32",1"""
321
- expected = [[2 , "line '21\n ' line 22" , 2 ],
322
- [3 , "line '31\n ' line 32" , 1 ]]
323
- expected = DataFrame (expected , columns = [
324
- 'id' , 'text' , 'num_lines' ])
325
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
326
- tm .assert_frame_equal (df , expected )
327
-
328
- data = """id,text,num_lines
329
- 1,"line '11\n ' \r \t line 12",2
330
- 2,"line '21\n ' \r \t line 22",2
331
- 3,"line '31\n ' \r \t line 32",1"""
332
- expected = [[2 , "line '21\n ' \r \t line 22" , 2 ],
333
- [3 , "line '31\n ' \r \t line 32" , 1 ]]
334
- expected = DataFrame (expected , columns = [
335
- 'id' , 'text' , 'num_lines' ])
336
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
337
- tm .assert_frame_equal (df , expected )
338
-
339
- def test_skiprows_lineterminator (self ):
340
- # see gh-9079
341
- data = '\n ' .join (['SMOSMANIA ThetaProbe-ML2X ' ,
342
- '2007/01/01 01:00 0.2140 U M ' ,
343
- '2007/01/01 02:00 0.2141 M O ' ,
344
- '2007/01/01 04:00 0.2142 D M ' ])
345
- expected = DataFrame ([['2007/01/01' , '01:00' , 0.2140 , 'U' , 'M' ],
346
- ['2007/01/01' , '02:00' , 0.2141 , 'M' , 'O' ],
347
- ['2007/01/01' , '04:00' , 0.2142 , 'D' , 'M' ]],
348
- columns = ['date' , 'time' , 'var' , 'flag' ,
349
- 'oflag' ])
350
-
351
- # test with default line terminators "LF" and "CRLF"
352
- df = self .read_csv (StringIO (data ), skiprows = 1 , delim_whitespace = True ,
353
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
354
- tm .assert_frame_equal (df , expected )
355
-
356
- df = self .read_csv (StringIO (data .replace ('\n ' , '\r \n ' )),
357
- skiprows = 1 , delim_whitespace = True ,
358
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
359
- tm .assert_frame_equal (df , expected )
360
-
361
- # "CR" is not respected with the Python parser yet
362
- if self .engine == 'c' :
363
- df = self .read_csv (StringIO (data .replace ('\n ' , '\r ' )),
364
- skiprows = 1 , delim_whitespace = True ,
365
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
366
- tm .assert_frame_equal (df , expected )
0 commit comments