diff --git a/.dvc/.gitignore b/.dvc/.gitignore new file mode 100755 index 0000000..528f30c --- /dev/null +++ b/.dvc/.gitignore @@ -0,0 +1,3 @@ +/config.local +/tmp +/cache diff --git a/.dvc/config b/.dvc/config new file mode 100755 index 0000000..e69de29 diff --git a/.dvc/plots/confusion.json b/.dvc/plots/confusion.json new file mode 100755 index 0000000..af1b48d --- /dev/null +++ b/.dvc/plots/confusion.json @@ -0,0 +1,107 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "facet": { + "field": "rev", + "type": "nominal" + }, + "spec": { + "transform": [ + { + "aggregate": [ + { + "op": "count", + "as": "xy_count" + } + ], + "groupby": [ + "", + "" + ] + }, + { + "impute": "xy_count", + "groupby": [ + "rev", + "" + ], + "key": "", + "value": 0 + }, + { + "impute": "xy_count", + "groupby": [ + "rev", + "" + ], + "key": "", + "value": 0 + }, + { + "joinaggregate": [ + { + "op": "max", + "field": "xy_count", + "as": "max_count" + } + ], + "groupby": [] + }, + { + "calculate": "datum.xy_count / datum.max_count", + "as": "percent_of_max" + } + ], + "encoding": { + "x": { + "field": "", + "type": "nominal", + "sort": "ascending", + "title": "" + }, + "y": { + "field": "", + "type": "nominal", + "sort": "ascending", + "title": "" + } + }, + "layer": [ + { + "mark": "rect", + "width": 300, + "height": 300, + "encoding": { + "color": { + "field": "xy_count", + "type": "quantitative", + "title": "", + "scale": { + "domainMin": 0, + "nice": true + } + } + } + }, + { + "mark": "text", + "encoding": { + "text": { + "field": "xy_count", + "type": "quantitative" + }, + "color": { + "condition": { + "test": "datum.percent_of_max > 0.5", + "value": "white" + }, + "value": "black" + } + } + } + ] + } +} diff --git a/.dvc/plots/confusion_normalized.json b/.dvc/plots/confusion_normalized.json new file mode 100755 index 0000000..1d38849 --- /dev/null +++ b/.dvc/plots/confusion_normalized.json @@ -0,0 +1,112 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "facet": { + "field": "rev", + "type": "nominal" + }, + "spec": { + "transform": [ + { + "aggregate": [ + { + "op": "count", + "as": "xy_count" + } + ], + "groupby": [ + "", + "" + ] + }, + { + "impute": "xy_count", + "groupby": [ + "rev", + "" + ], + "key": "", + "value": 0 + }, + { + "impute": "xy_count", + "groupby": [ + "rev", + "" + ], + "key": "", + "value": 0 + }, + { + "joinaggregate": [ + { + "op": "sum", + "field": "xy_count", + "as": "sum_y" + } + ], + "groupby": [ + "" + ] + }, + { + "calculate": "datum.xy_count / datum.sum_y", + "as": "percent_of_y" + } + ], + "encoding": { + "x": { + "field": "", + "type": "nominal", + "sort": "ascending", + "title": "" + }, + "y": { + "field": "", + "type": "nominal", + "sort": "ascending", + "title": "" + } + }, + "layer": [ + { + "mark": "rect", + "width": 300, + "height": 300, + "encoding": { + "color": { + "field": "percent_of_y", + "type": "quantitative", + "title": "", + "scale": { + "domain": [ + 0, + 1 + ] + } + } + } + }, + { + "mark": "text", + "encoding": { + "text": { + "field": "percent_of_y", + "type": "quantitative", + "format": ".2f" + }, + "color": { + "condition": { + "test": "datum.percent_of_y > 0.5", + "value": "white" + }, + "value": "black" + } + } + } + ] + } +} diff --git a/.dvc/plots/default.json b/.dvc/plots/default.json new file mode 100755 index 0000000..9cf71ce --- /dev/null +++ b/.dvc/plots/default.json @@ -0,0 +1,31 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "width": 300, + "height": 300, + "mark": { + "type": "line" + }, + "encoding": { + "x": { + "field": "", + "type": "quantitative", + "title": "" + }, + "y": { + "field": "", + "type": "quantitative", + "title": "", + "scale": { + "zero": false + } + }, + "color": { + "field": "rev", + "type": "nominal" + } + } +} diff --git a/.dvc/plots/linear.json b/.dvc/plots/linear.json new file mode 100755 index 0000000..65549f9 --- /dev/null +++ b/.dvc/plots/linear.json @@ -0,0 +1,116 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "width": 300, + "height": 300, + "layer": [ + { + "encoding": { + "x": { + "field": "", + "type": "quantitative", + "title": "" + }, + "y": { + "field": "", + "type": "quantitative", + "title": "", + "scale": { + "zero": false + } + }, + "color": { + "field": "rev", + "type": "nominal" + } + }, + "layer": [ + { + "mark": "line" + }, + { + "selection": { + "label": { + "type": "single", + "nearest": true, + "on": "mouseover", + "encodings": [ + "x" + ], + "empty": "none", + "clear": "mouseout" + } + }, + "mark": "point", + "encoding": { + "opacity": { + "condition": { + "selection": "label", + "value": 1 + }, + "value": 0 + } + } + } + ] + }, + { + "transform": [ + { + "filter": { + "selection": "label" + } + } + ], + "layer": [ + { + "mark": { + "type": "rule", + "color": "gray" + }, + "encoding": { + "x": { + "field": "", + "type": "quantitative" + } + } + }, + { + "encoding": { + "text": { + "type": "quantitative", + "field": "" + }, + "x": { + "field": "", + "type": "quantitative" + }, + "y": { + "field": "", + "type": "quantitative" + } + }, + "layer": [ + { + "mark": { + "type": "text", + "align": "left", + "dx": 5, + "dy": -5 + }, + "encoding": { + "color": { + "type": "nominal", + "field": "rev" + } + } + } + ] + } + ] + } + ] +} diff --git a/.dvc/plots/scatter.json b/.dvc/plots/scatter.json new file mode 100755 index 0000000..9af9304 --- /dev/null +++ b/.dvc/plots/scatter.json @@ -0,0 +1,104 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "width": 300, + "height": 300, + "layer": [ + { + "encoding": { + "x": { + "field": "", + "type": "quantitative", + "title": "" + }, + "y": { + "field": "", + "type": "quantitative", + "title": "", + "scale": { + "zero": false + } + }, + "color": { + "field": "rev", + "type": "nominal" + } + }, + "layer": [ + { + "mark": "point" + }, + { + "selection": { + "label": { + "type": "single", + "nearest": true, + "on": "mouseover", + "encodings": [ + "x" + ], + "empty": "none", + "clear": "mouseout" + } + }, + "mark": "point", + "encoding": { + "opacity": { + "condition": { + "selection": "label", + "value": 1 + }, + "value": 0 + } + } + } + ] + }, + { + "transform": [ + { + "filter": { + "selection": "label" + } + } + ], + "layer": [ + { + "encoding": { + "text": { + "type": "quantitative", + "field": "" + }, + "x": { + "field": "", + "type": "quantitative" + }, + "y": { + "field": "", + "type": "quantitative" + } + }, + "layer": [ + { + "mark": { + "type": "text", + "align": "left", + "dx": 5, + "dy": -5 + }, + "encoding": { + "color": { + "type": "nominal", + "field": "rev" + } + } + } + ] + } + ] + } + ] +} diff --git a/.dvc/plots/smooth.json b/.dvc/plots/smooth.json new file mode 100755 index 0000000..d497ce7 --- /dev/null +++ b/.dvc/plots/smooth.json @@ -0,0 +1,39 @@ +{ + "$schema": "https://vega.github.io/schema/vega-lite/v4.json", + "data": { + "values": "" + }, + "title": "", + "mark": { + "type": "line" + }, + "encoding": { + "x": { + "field": "", + "type": "quantitative", + "title": "" + }, + "y": { + "field": "", + "type": "quantitative", + "title": "", + "scale": { + "zero": false + } + }, + "color": { + "field": "rev", + "type": "nominal" + } + }, + "transform": [ + { + "loess": "", + "on": "", + "groupby": [ + "rev" + ], + "bandwidth": 0.3 + } + ] +} diff --git a/.dvcignore b/.dvcignore new file mode 100755 index 0000000..5197305 --- /dev/null +++ b/.dvcignore @@ -0,0 +1,3 @@ +# Add patterns of files dvc should ignore, which could improve +# the performance. Learn more at +# https://dvc.org/doc/user-guide/dvcignore diff --git a/environment.yml b/environment.yml index 00b25ae..f62eca1 100644 --- a/environment.yml +++ b/environment.yml @@ -19,9 +19,11 @@ dependencies: - astor=0.8.1=py39h06a4308_0 - astunparse=1.6.3=py_0 - async-timeout=3.0.1=py39h06a4308_0 + - atpublic=1.0=py_0 - attrs=21.2.0=pyhd3eb1b0_0 - blas=1.0=mkl - blinker=1.4=py39h06a4308_0 + - bzip2=1.0.8=h7b6447c_0 - c-ares=1.17.1=h27cfd23_0 - ca-certificates=2021.5.25=h06a4308_1 - cached-property=1.5.2=py_0 @@ -31,6 +33,9 @@ dependencies: - chardet=3.0.4=py39h06a4308_1003 - click=8.0.1=pyhd3eb1b0_0 - cloudpickle=1.6.0=py_0 + - colorama=0.4.4=pyhd3eb1b0_0 + - commonmark=0.9.1=py_0 + - configobj=5.0.6=py39h06a4308_1 - configparser=5.0.2=pyhd3eb1b0_0 - coverage=5.5=py39h27cfd23_2 - cryptography=3.4.7=py39hd23ed53_0 @@ -39,15 +44,28 @@ dependencies: - cython=0.29.23=py39h2531618_0 - databricks-cli=0.9.1=py_0 - dbus=1.13.18=hb2f20db_0 + - decorator=5.0.9=pyhd3eb1b0_0 + - dictdiffer=0.8.1=pyhd8ed1ab_0 + - diskcache=5.2.1=pyh44b312d_0 + - distro=1.5.0=pyhd3eb1b0_1 - docker-py=4.4.1=py39h06a4308_5 - docker-pycreds=0.4.0=py_0 - docopt=0.6.2=py39h06a4308_0 + - dpath=2.0.1=py39hf3d152e_0 + - dulwich=0.20.23=py39h3811e60_0 + - dvc=2.3.0=py39hf3d152e_0 - entrypoints=0.3=py39h06a4308_0 - expat=2.4.1=h2531618_2 - flask=1.1.2=pyhd3eb1b0_0 - flatbuffers=2.0.0=h2531618_0 + - flatten-dict=0.3.0=pyh9f0ad1d_0 + - flufl.lock=3.2=py_0 - fontconfig=2.13.1=h6c09931_0 - freetype=2.10.4=h5ab3b9f_0 + - fsspec=2021.5.0=pyhd8ed1ab_0 + - ftfy=5.8=py_0 + - funcy=1.16=pyhd8ed1ab_0 + - future=0.18.2=py39h06a4308_1 - gast=0.4.0=py_0 - gettext=0.21.0=hf68c758_0 - giflib=5.2.1=h7b6447c_0 @@ -57,6 +75,7 @@ dependencies: - google-auth=1.30.1=pyhd3eb1b0_0 - google-auth-oauthlib=0.4.1=py_2 - google-pasta=0.2.0=py_0 + - grandalf=0.6=py_0 - greenlet=1.1.0=py39h2531618_0 - grpcio=1.36.1=py39h2157cd5_1 - gst-plugins-base=1.18.4=hf529b03_2 @@ -72,6 +91,7 @@ dependencies: - itsdangerous=2.0.1=pyhd3eb1b0_0 - jinja2=3.0.0=pyhd3eb1b0_0 - jpeg=9d=h36c2ea0_0 + - jsonpath-ng=1.5.2=pyh9f0ad1d_0 - jsonpickle=2.0.0=pyhd3eb1b0_0 - kaggle=1.5.12=py39hf3d152e_0 - keras-preprocessing=1.1.2=pyhd3eb1b0_0 @@ -88,6 +108,7 @@ dependencies: - libgcc-ng=9.3.0=h5101ec6_17 - libgfortran-ng=7.5.0=ha8ba4b0_17 - libgfortran4=7.5.0=ha8ba4b0_17 + - libgit2=1.1.0=h0b03e73_0 - libglib=2.68.2=h3e27bee_0 - libgomp=9.3.0=h5101ec6_17 - libiconv=1.16=h516909a_0 @@ -109,6 +130,7 @@ dependencies: - libxkbcommon=1.0.3=he3ba5ed_0 - libxml2=2.9.12=h72842e0_0 - lz4-c=1.9.3=h2531618_0 + - mailchecker=4.0.8=pyhd8ed1ab_0 - mako=1.1.4=pyhd3eb1b0_0 - markdown=3.3.4=py39h06a4308_0 - markupsafe=2.0.1=py39h27cfd23_0 @@ -123,7 +145,9 @@ dependencies: - munch=2.5.0=py_0 - mysql-common=8.0.25=ha770c72_0 - mysql-libs=8.0.25=h935591d_0 + - nanotime=0.5.2=py_0 - ncurses=6.2=he6710b0_1 + - networkx=2.5=py_0 - ninja=1.10.2=hff7bd54_1 - nspr=4.30=h9c3ff4c_0 - nss=3.64=hb5efdd6_0 @@ -135,16 +159,26 @@ dependencies: - opt_einsum=3.3.0=pyhd3eb1b0_1 - packaging=20.9=pyhd3eb1b0_0 - pandas=1.2.4=py39h2531618_0 + - pathlib2=2.3.5=py39h06a4308_2 + - pathspec=0.7.0=py_0 - pcre=8.44=he6710b0_0 + - pcre2=10.35=h14c3975_1 + - phonenumbers=8.12.24=pyhd3eb1b0_0 - pillow=8.2.0=py39he98fc37_0 - pip=21.1.2=py39h06a4308_0 + - ply=3.11=py39h06a4308_0 - prometheus_client=0.11.0=pyhd3eb1b0_0 - prometheus_flask_exporter=0.18.2=pyhd8ed1ab_0 - protobuf=3.14.0=py39h2531618_1 + - psutil=5.8.0=py39h27cfd23_1 - py-cpuinfo=8.0.0=pyhd3eb1b0_0 - pyasn1=0.4.8=py_0 - pyasn1-modules=0.2.8=py_0 - pycparser=2.20=py_2 + - pydot=1.2.4=py_0 + - pygit2=1.6.0=py39h3811e60_0 + - pygments=2.9.0=pyhd3eb1b0_0 + - pygtrie=2.3.2=pyh8c360ce_0 - pyjwt=2.1.0=py39h06a4308_0 - pymongo=3.11.4=py39h2531618_0 - pyopenssl=20.0.1=pyhd3eb1b0_1 @@ -156,9 +190,11 @@ dependencies: - pyqtwebengine=5.12.1=py39h0fcd23e_7 - pysocks=1.7.1=py39h06a4308_0 - python=3.9.5=h12debd9_4 + - python-benedict=0.24.0=pyhd8ed1ab_0 - python-dateutil=2.8.1=pyhd3eb1b0_0 - python-editor=1.0.4=py_0 - python-flatbuffers=1.12=pyhd3eb1b0_0 + - python-fsutil=0.5.0=pyhd8ed1ab_0 - python-slugify=5.0.2=pyhd3eb1b0_0 - python_abi=3.9=1_cp39 - pytorch=1.8.1=py3.9_cuda10.2_cudnn7.6.5_0 @@ -169,11 +205,16 @@ dependencies: - readline=8.1=h27cfd23_0 - requests=2.25.1=pyhd3eb1b0_0 - requests-oauthlib=1.3.0=py_0 + - rich=10.3.0=py39hf3d152e_0 - rsa=4.7.2=pyhd3eb1b0_1 + - ruamel.yaml=0.16.12=py39h27cfd23_1 + - ruamel.yaml.clib=0.2.0=py39h27cfd23_0 - sacred=0.7.4=py_0 - scipy=1.6.2=py39had2a1c9_1 - seaborn=0.11.1=pyhd3eb1b0_0 - setuptools=52.0.0=py39h06a4308_0 + - shortuuid=1.0.1=py39hf3d152e_4 + - shtab=1.3.6=pyhd8ed1ab_0 - six=1.15.0=py39h06a4308_0 - smmap=4.0.0=pyhd3eb1b0_0 - snappy=1.1.8=he6710b0_0 @@ -189,6 +230,7 @@ dependencies: - termcolor=1.1.0=py39h06a4308_1 - text-unidecode=1.3=py_0 - tk=8.6.10=hbc83047_0 + - toml=0.10.2=pyhd3eb1b0_0 - torchaudio=0.8.1=py39 - torchvision=0.2.2=py_3 - tornado=6.1=py39h27cfd23_0 @@ -198,13 +240,17 @@ dependencies: - tzdata=2020f=h52ac0ba_0 - unidecode=1.2.0=pyhd3eb1b0_0 - urllib3=1.24.3=py_1 + - voluptuous=0.12.1=pyhd3deb0d_0 + - wcwidth=0.2.5=py_0 - websocket-client=0.58.0=py39h06a4308_4 - werkzeug=1.0.1=pyhd3eb1b0_0 - wheel=0.35.1=pyhd3eb1b0_0 - wrapt=1.12.1=py39he8ac12f_1 + - xmltodict=0.12.0=py_0 - xz=5.2.5=h7b6447c_0 - yaml=0.2.5=h7b6447c_0 - yarl=1.6.3=py39h27cfd23_0 + - zc.lockfile=2.0=py_0 - zipp=3.4.1=pyhd3eb1b0_0 - zlib=1.2.11=h7b6447c_3 - zstd=1.4.9=haebb681_0