cubicweb: comparison dataimport/csv.py

equal deleted inserted replaced

-:bd98cd3b7869
+:bb0c7dbd1fe7
 # You should have received a copy of the GNU Lesser General Public License along
 # with CubicWeb.  If not, see <http://www.gnu.org/licenses/>.
 """Functions to help importing CSV data"""
 from __future__ import absolute_import, print_function
+import codecs
 import csv as csvmod
 import warnings
 import os.path as osp
-from six import string_types
+from six import PY2, PY3, string_types
 from logilab.common import shellutils
 def count_lines(stream_or_filename):
 warnings.warn("[3.20] 'separator' kwarg is deprecated, use 'delimiter' instead")
 if quote is not None:
 quotechar = quote
 warnings.warn("[3.20] 'quote' kwarg is deprecated, use 'quotechar' instead")
 if isinstance(stream_or_path, string_types):
-if not osp.exists(stream_or_path):
+stream = open(stream_or_path, 'rb')
-raise Exception("file doesn't exists: %s" % stream_or_path)
-stream = open(stream_or_path)
 else:
 stream = stream_or_path
 rowcount = count_lines(stream)
 if skipfirst:
 rowcount -= 1
 if skip_empty (the default), lines without any values specified (only
 separators) will be skipped. This is useful for Excel exports which may be
 full of such lines.
 """
+if PY3:
+stream = codecs.getreader(encoding)(stream)
 if separator is not None:
 delimiter = separator
 warnings.warn("[3.20] 'separator' kwarg is deprecated, use 'delimiter' instead")
 if quote is not None:
 quotechar = quote
 it = iter(csvmod.reader(stream, delimiter=delimiter, quotechar=quotechar))
 if not ignore_errors:
 if skipfirst:
 next(it)
 for row in it:
-decoded = [item.decode(encoding) for item in row]
+if PY2:
+decoded = [item.decode(encoding) for item in row]
+else:
+decoded = row
 if not skip_empty or any(decoded):
 yield decoded
 else:
 if skipfirst:
 try:
 except StopIteration:
 break
 # Error in CSV, ignore line and continue
 except csvmod.Error:
 continue
-decoded = [item.decode(encoding) for item in row]
+if PY2:
+decoded = [item.decode(encoding) for item in row]
+else:
+decoded = row
 if not skip_empty or any(decoded):
 yield decoded

changeset 10807	bb0c7dbd1fe7
parent 10669	155c29e0ed1c
child 10907	9ae707db5265