Skip to content

Commit

Permalink
fix: Add glob, user dir and env var support on Windows #634
Browse files Browse the repository at this point in the history
  • Loading branch information
jpmckinney committed Jul 13, 2024
1 parent 0166197 commit 6973dfd
Show file tree
Hide file tree
Showing 5 changed files with 72 additions and 0 deletions.
1 change: 1 addition & 0 deletions CHANGELOG.rst
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ Unreleased
- feat: Add a Docker image.
- feat: Add man pages to the sdist and wheel distributions.
- fix: :doc:`/scripts/csvstat` no longer errors when a column is a time delta and :code:`--json` is set.
- fix: When taking arguments from ``sys.argv`` on Windows, glob patterns, user directories, and environment variables are expanded.

2.0.0 - May 1, 2024
-------------------
Expand Down
29 changes: 29 additions & 0 deletions csvkit/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,11 @@
import gzip
import itertools
import lzma
import os
import re
import sys
import warnings
from glob import glob
from os.path import splitext

import agate
Expand Down Expand Up @@ -73,6 +76,11 @@ def __init__(self, args=None, output_file=None, error_file=None):
"""
Perform argument processing and other setup for a CSVKitUtility.
"""
if args is None:
args = sys.argv[1:]
if os.name == 'nt':
args = _expand_args(args)

self._init_common_parser()
self.add_arguments()
self.args = self.argparser.parse_args(args)
Expand Down Expand Up @@ -550,3 +558,24 @@ def parse_column_identifiers(ids, column_names, column_offset=1, excluded_column
excludes.append(match_column_identifier(column_names, x, column_offset))

return [c for c in columns if c not in excludes]


# Adapted from https://github.com/pallets/click/blame/main/src/click/utils.py
def _expand_args(args):
out = []

for arg in args:
arg = os.path.expanduser(arg)
arg = os.path.expandvars(arg)

try:
matches = glob(arg, recursive=True)
except re.error:
matches = []

if matches:
out.extend(matches)
else:
out.append(arg)

return out
10 changes: 10 additions & 0 deletions tests/test_utilities/test_csvjoin.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,6 @@
import os
import sys
import unittest
from unittest.mock import patch

from csvkit.utilities.csvjoin import CSVJoin, launch_new_instance
Expand Down Expand Up @@ -34,6 +36,14 @@ def test_join_options(self):
'You must provide join column names when performing an outer join.',
)

@unittest.skipIf(os.name != 'nt', 'Windows only')
def test_glob(self):
self.assertRows(['--no-inference', '-c', 'a', 'examples/dummy?.csv'], [
['a', 'b', 'c', 'b2', 'c2'],
['1', '2', '3', '2', '3'],
['1', '2', '3', '4', '5'],
])

def test_sequential(self):
output = self.get_output_as_io(['examples/join_a.csv', 'examples/join_b.csv'])
self.assertEqual(len(output.readlines()), 4)
Expand Down
18 changes: 18 additions & 0 deletions tests/test_utilities/test_csvsql.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
import io
import os
import sys
import unittest
from textwrap import dedent
from unittest.mock import patch

Expand Down Expand Up @@ -63,6 +64,23 @@ def tearDown(self):
if os.path.exists(self.db_file):
os.remove(self.db_file)

@unittest.skipIf(os.name != 'nt', 'Windows only')
def test_glob(self):
sql = self.get_output(['examples/dummy*.csv'])

self.assertEqual(sql.replace('\t', ' '), dedent('''\
CREATE TABLE dummy2 (
a BOOLEAN NOT NULL,
b DECIMAL NOT NULL,
c DECIMAL NOT NULL
);
CREATE TABLE dummy3 (
a BOOLEAN NOT NULL,
b DECIMAL NOT NULL,
c DECIMAL NOT NULL
);
''')) # noqa: W291

def test_create_table(self):
sql = self.get_output(['--tables', 'foo', 'examples/testfixed_converted.csv'])

Expand Down
14 changes: 14 additions & 0 deletions tests/test_utilities/test_csvstack.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,6 @@
import os
import sys
import unittest
from unittest.mock import patch

from csvkit.utilities.csvstack import CSVStack, launch_new_instance
Expand All @@ -20,6 +22,18 @@ def test_options(self):
'The number of grouping values must be equal to the number of CSV files being stacked.',
)

@unittest.skipIf(os.name != 'nt', 'Windows only')
def test_glob(self):
self.assertRows(['examples/dummy*.csv'], [
['a', 'b', 'c', 'd'],
['1', '2', '3', ''],
['1', '2', '3', ''],
['1', '2', '3', ''],
['1', '4', '5', ''],
['1', '2', '3', ''],
['1', '2', '3', '4'],
])

def test_skip_lines(self):
self.assertRows(['--skip-lines', '3', 'examples/test_skip_lines.csv', 'examples/test_skip_lines.csv'], [
['a', 'b', 'c'],
Expand Down

0 comments on commit 6973dfd

Please sign in to comment.