Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
__pycache__/
*.py[cod]
*$py.class
.pytest_cache

# C extensions
*.so
Expand Down
3 changes: 3 additions & 0 deletions .travis.yml
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,9 @@ python:
- '3.6'
install:
- pip install ".[testing]"
- pip install ".[nlp]"
- pip install ".[s3driver]"
- python -m nltk.downloader punkt stopwords wordnet
script: pytest
deploy:
provider: pypi
Expand Down
7 changes: 5 additions & 2 deletions quantgov/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,11 +3,14 @@

__all__ = [
'corpora',
'corpus',
'estimator',
'project',
'utils',
]

from .corpora.utils import load_driver
from . import corpora # Backwards compatibility

__version__ = '0.3.3'
from .utils import load_driver

__version__ = '0.4.0'
11 changes: 7 additions & 4 deletions quantgov/__main__.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@
import requests

import quantgov
import quantgov.corpora.builtins
import quantgov.corpus.builtins

from pathlib import Path

Expand All @@ -40,7 +40,7 @@ def parse_args():
# Corpus command
corpus = subparsers.add_parser('corpus')
corpus_subcommands = corpus.add_subparsers(dest='subcommand')
for command, builtin in quantgov.corpora.builtins.commands.items():
for command, builtin in quantgov.corpus.builtins.commands.items():
subcommand = corpus_subcommands.add_parser(
command, help=builtin.cli.help)
subcommand.add_argument(
Expand Down Expand Up @@ -118,6 +118,9 @@ def parse_args():
estimate.add_argument(
'--probability', action='store_true',
help='output probabilities instead of predictions')
estimate.add_argument(
'--precision', default=4, type=int,
help='number of decimal places to round the probabilities')
estimate.add_argument(
'-o', '--outfile',
type=lambda x: open(x, 'w', newline='', encoding='utf-8'),
Expand Down Expand Up @@ -161,7 +164,7 @@ def start_component(args):
def run_corpus_builtin(args):
driver = quantgov.load_driver(args.corpus)
writer = csv.writer(args.outfile)
builtin = quantgov.corpora.builtins.commands[args.subcommand]
builtin = quantgov.corpus.builtins.commands[args.subcommand]
func_args = {i: j for i, j in vars(args).items()
if i not in {'command', 'subcommand', 'outfile', 'corpus'}}
writer.writerow(driver.index_labels + builtin.get_columns(func_args))
Expand All @@ -187,7 +190,7 @@ def run_estimator(args):
elif args.subcommand == "estimate":
quantgov.estimator.estimate(
args.vectorizer, args.model, args.corpus, args.probability,
args.outfile
args.precision, args.outfile
)


Expand Down
13 changes: 11 additions & 2 deletions quantgov/corpora/__init__.py
Original file line number Diff line number Diff line change
@@ -1,9 +1,18 @@
from .structures import (
import warnings

from ..corpus import (
Document,
CorpusStreamer,
CorpusDriver,
FlatFileCorpusDriver,
RecursiveDirectoryCorpusDriver,
NamePatternCorpusDriver,
IndexDriver
IndexDriver,
S3Driver,
S3DatabaseDriver
)

warnings.warn(
("quantgov.corpora has been moved to quantgov.corpus and will be removed"
" in a future version."),
DeprecationWarning)
95 changes: 0 additions & 95 deletions quantgov/corpora/builtins.py

This file was deleted.

16 changes: 0 additions & 16 deletions quantgov/corpora/utils.py

This file was deleted.

11 changes: 11 additions & 0 deletions quantgov/corpus/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
from .structures import (
Document,
CorpusStreamer,
CorpusDriver,
FlatFileCorpusDriver,
RecursiveDirectoryCorpusDriver,
NamePatternCorpusDriver,
IndexDriver,
S3Driver,
S3DatabaseDriver
)
Loading