@@ -223,117 +223,3 @@ def test_na_values_keep_default(self):
223
223
'Three' : ['None' , 'two' , 'None' , 'nan' , 'five' , '' ,
224
224
'seven' ]})
225
225
tm .assert_frame_equal (xp .reindex (columns = df .columns ), df )
226
-
227
- def test_skiprow_with_newline (self ):
228
- # see gh-12775 and gh-10911
229
- data = """id,text,num_lines
230
- 1,"line 11
231
- line 12",2
232
- 2,"line 21
233
- line 22",2
234
- 3,"line 31",1"""
235
- expected = [[2 , 'line 21\n line 22' , 2 ],
236
- [3 , 'line 31' , 1 ]]
237
- expected = DataFrame (expected , columns = [
238
- 'id' , 'text' , 'num_lines' ])
239
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
240
- tm .assert_frame_equal (df , expected )
241
-
242
- data = ('a,b,c\n ~a\n b~,~e\n d~,'
243
- '~f\n f~\n 1,2,~12\n 13\n 14~' )
244
- expected = [['a\n b' , 'e\n d' , 'f\n f' ]]
245
- expected = DataFrame (expected , columns = [
246
- 'a' , 'b' , 'c' ])
247
- df = self .read_csv (StringIO (data ),
248
- quotechar = "~" ,
249
- skiprows = [2 ])
250
- tm .assert_frame_equal (df , expected )
251
-
252
- data = ('Text,url\n ~example\n '
253
- 'sentence\n one~,url1\n ~'
254
- 'example\n sentence\n two~,url2\n ~'
255
- 'example\n sentence\n three~,url3' )
256
- expected = [['example\n sentence\n two' , 'url2' ]]
257
- expected = DataFrame (expected , columns = [
258
- 'Text' , 'url' ])
259
- df = self .read_csv (StringIO (data ),
260
- quotechar = "~" ,
261
- skiprows = [1 , 3 ])
262
- tm .assert_frame_equal (df , expected )
263
-
264
- def test_skiprow_with_quote (self ):
265
- # see gh-12775 and gh-10911
266
- data = """id,text,num_lines
267
- 1,"line '11' line 12",2
268
- 2,"line '21' line 22",2
269
- 3,"line '31' line 32",1"""
270
- expected = [[2 , "line '21' line 22" , 2 ],
271
- [3 , "line '31' line 32" , 1 ]]
272
- expected = DataFrame (expected , columns = [
273
- 'id' , 'text' , 'num_lines' ])
274
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
275
- tm .assert_frame_equal (df , expected )
276
-
277
- def test_skiprow_with_newline_and_quote (self ):
278
- # see gh-12775 and gh-10911
279
- data = """id,text,num_lines
280
- 1,"line \n '11' line 12",2
281
- 2,"line \n '21' line 22",2
282
- 3,"line \n '31' line 32",1"""
283
- expected = [[2 , "line \n '21' line 22" , 2 ],
284
- [3 , "line \n '31' line 32" , 1 ]]
285
- expected = DataFrame (expected , columns = [
286
- 'id' , 'text' , 'num_lines' ])
287
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
288
- tm .assert_frame_equal (df , expected )
289
-
290
- data = """id,text,num_lines
291
- 1,"line '11\n ' line 12",2
292
- 2,"line '21\n ' line 22",2
293
- 3,"line '31\n ' line 32",1"""
294
- expected = [[2 , "line '21\n ' line 22" , 2 ],
295
- [3 , "line '31\n ' line 32" , 1 ]]
296
- expected = DataFrame (expected , columns = [
297
- 'id' , 'text' , 'num_lines' ])
298
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
299
- tm .assert_frame_equal (df , expected )
300
-
301
- data = """id,text,num_lines
302
- 1,"line '11\n ' \r \t line 12",2
303
- 2,"line '21\n ' \r \t line 22",2
304
- 3,"line '31\n ' \r \t line 32",1"""
305
- expected = [[2 , "line '21\n ' \r \t line 22" , 2 ],
306
- [3 , "line '31\n ' \r \t line 32" , 1 ]]
307
- expected = DataFrame (expected , columns = [
308
- 'id' , 'text' , 'num_lines' ])
309
- df = self .read_csv (StringIO (data ), skiprows = [1 ])
310
- tm .assert_frame_equal (df , expected )
311
-
312
- def test_skiprows_lineterminator (self ):
313
- # see gh-9079
314
- data = '\n ' .join (['SMOSMANIA ThetaProbe-ML2X ' ,
315
- '2007/01/01 01:00 0.2140 U M ' ,
316
- '2007/01/01 02:00 0.2141 M O ' ,
317
- '2007/01/01 04:00 0.2142 D M ' ])
318
- expected = DataFrame ([['2007/01/01' , '01:00' , 0.2140 , 'U' , 'M' ],
319
- ['2007/01/01' , '02:00' , 0.2141 , 'M' , 'O' ],
320
- ['2007/01/01' , '04:00' , 0.2142 , 'D' , 'M' ]],
321
- columns = ['date' , 'time' , 'var' , 'flag' ,
322
- 'oflag' ])
323
-
324
- # test with default line terminators "LF" and "CRLF"
325
- df = self .read_csv (StringIO (data ), skiprows = 1 , delim_whitespace = True ,
326
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
327
- tm .assert_frame_equal (df , expected )
328
-
329
- df = self .read_csv (StringIO (data .replace ('\n ' , '\r \n ' )),
330
- skiprows = 1 , delim_whitespace = True ,
331
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
332
- tm .assert_frame_equal (df , expected )
333
-
334
- # "CR" is not respected with the Python parser yet
335
- if self .engine == 'c' :
336
- df = self .read_csv (StringIO (data .replace ('\n ' , '\r ' )),
337
- skiprows = 1 , delim_whitespace = True ,
338
- names = ['date' , 'time' , 'var' , 'flag' , 'oflag' ])
339
- tm .assert_frame_equal (df , expected )
0 commit comments