add train config and metadata

Browse files

Files changed (4) hide show

conda-environment.yaml +200 -0
config.yaml +837 -0
wandb-metadata.json +117 -0
wandb-summary.json +1 -0

conda-environment.yaml ADDED Viewed

	@@ -0,0 +1,200 @@

+name: pie-document-level
+channels:
+  - pytorch
+  - defaults
+dependencies:
+  - _libgcc_mutex=0.1=main
+  - _openmp_mutex=5.1=1_gnu
+  - ca-certificates=2023.05.30=h06a4308_0
+  - ld_impl_linux-64=2.38=h1181459_1
+  - libffi=3.4.4=h6a678d5_0
+  - libgcc-ng=11.2.0=h1234567_1
+  - libgomp=11.2.0=h1234567_1
+  - libstdcxx-ng=11.2.0=h1234567_1
+  - ncurses=6.4=h6a678d5_0
+  - openssl=3.0.10=h7f8727e_2
+  - pip=23.2.1=py39h06a4308_0
+  - python=3.9.17=h955ad1f_0
+  - readline=8.2=h5eee18b_0
+  - setuptools=68.0.0=py39h06a4308_0
+  - sqlite=3.41.2=h5eee18b_0
+  - tk=8.6.12=h1ccaba5_0
+  - wheel=0.38.4=py39h06a4308_0
+  - xz=5.4.2=h5eee18b_0
+  - zlib=1.2.13=h5eee18b_0
+  - pip:
+      - absl-py==1.4.0
+      - accelerate==0.22.0
+      - aiohttp==3.8.5
+      - aiosignal==1.3.1
+      - alembic==1.12.0
+      - annotated-types==0.5.0
+      - antlr4-python3-runtime==4.9.3
+      - appdirs==1.4.4
+      - asciidag==0.2.0
+      - async-timeout==4.0.3
+      - attrs==23.1.0
+      - auto-gptq==0.4.2
+      - autopage==0.5.1
+      - black==23.7.0
+      - blis==0.7.10
+      - catalogue==2.0.9
+      - certifi==2023.7.22
+      - cfgv==3.4.0
+      - charset-normalizer==3.2.0
+      - click==8.1.7
+      - cliff==4.3.0
+      - cmaes==0.10.0
+      - cmake==3.27.4.1
+      - cmd2==2.4.3
+      - coloredlogs==15.0.1
+      - colorlog==6.7.0
+      - confection==0.1.1
+      - coverage==7.3.0
+      - cymem==2.0.7
+      - datasets==2.14.4
+      - dill==0.3.7
+      - distlib==0.3.7
+      - docker-pycreds==0.4.0
+      - en-core-web-trf==3.6.1
+      - exceptiongroup==1.1.3
+      - fastjsonschema==2.18.0
+      - filelock==3.12.3
+      - flake8==6.1.0
+      - frozenlist==1.4.0
+      - fsspec==2023.6.0
+      - gitdb==4.0.10
+      - gitpython==3.1.34
+      - greenlet==2.0.2
+      - huggingface-hub==0.19.4
+      - humanfriendly==10.0
+      - hydra-colorlog==1.2.0
+      - hydra-core==1.3.2
+      - hydra-optuna-sweeper==1.2.0
+      - identify==2.5.27
+      - idna==3.4
+      - importlib-metadata==6.8.0
+      - iniconfig==2.0.0
+      - isort==5.12.0
+      - jedi==0.19.0
+      - jinja2==3.1.2
+      - joblib==1.3.2
+      - jsonschema==4.19.0
+      - jsonschema-specifications==2023.7.1
+      - jupyter-core==5.3.1
+      - langcodes==3.3.0
+      - lightning-utilities==0.9.0
+      - lit==16.0.6
+      - mako==1.2.4
+      - markdown-it-py==3.0.0
+      - markupsafe==2.1.3
+      - mccabe==0.7.0
+      - mdurl==0.1.2
+      - mpmath==1.3.0
+      - multidict==6.0.4
+      - multiprocess==0.70.15
+      - murmurhash==1.0.9
+      - mypy-extensions==1.0.0
+      - nbformat==5.9.2
+      - nbstripout==0.6.1
+      - networkx==3.1
+      - nltk==3.8.1
+      - nodeenv==1.8.0
+      - numpy==1.25.2
+      - nvidia-cublas-cu11==11.10.3.66
+      - nvidia-cuda-cupti-cu11==11.7.101
+      - nvidia-cuda-nvrtc-cu11==11.7.99
+      - nvidia-cuda-runtime-cu11==11.7.99
+      - nvidia-cudnn-cu11==8.5.0.96
+      - nvidia-cufft-cu11==10.9.0.58
+      - nvidia-curand-cu11==10.2.10.91
+      - nvidia-cusolver-cu11==11.4.0.1
+      - nvidia-cusparse-cu11==11.7.4.91
+      - nvidia-nccl-cu11==2.14.3
+      - nvidia-nvtx-cu11==11.7.91
+      - omegaconf==2.3.0
+      - optimum==1.12.0
+      - optuna==2.10.1
+      - packaging==23.1
+      - pandas==2.1.0
+      - parso==0.8.3
+      - pathspec==0.11.2
+      - pathtools==0.1.2
+      - pathy==0.10.2
+      - pbr==5.11.1
+      - peft==0.5.0
+      - pie-datasets==0.8.1
+      - pie-models==0.3.0
+      - pie-modules==0.10.6
+      - platformdirs==3.10.0
+      - plotext==5.2.8
+      - pluggy==1.3.0
+      - pre-commit==3.4.0
+      - preshed==3.0.8
+      - prettytable==3.8.0
+      - protobuf==4.24.2
+      - psutil==5.9.5
+      - pudb==2022.1.3
+      - pyarrow==13.0.0
+      - pycodestyle==2.11.0
+      - pydantic==2.3.0
+      - pydantic-core==2.6.3
+      - pyflakes==3.1.0
+      - pygments==2.16.1
+      - pyperclip==1.8.2
+      - pyrootutils==1.0.4
+      - pytest==7.4.1
+      - pytest-cov==4.1.0
+      - python-dateutil==2.8.2
+      - python-dotenv==1.0.0
+      - pytorch-crf==0.7.2
+      - pytorch-ie==0.29.8
+      - pytorch-lightning==2.1.2
+      - pytz==2023.3.post1
+      - pyyaml==6.0.1
+      - referencing==0.30.2
+      - regex==2023.8.8
+      - requests==2.31.0
+      - rich==13.5.2
+      - rouge==1.0.1
+      - rpds-py==0.10.2
+      - safetensors==0.3.3
+      - scipy==1.11.2
+      - sentencepiece==0.1.99
+      - sentry-sdk==1.30.0
+      - setproctitle==1.3.2
+      - sh==2.0.6
+      - six==1.16.0
+      - smart-open==6.3.0
+      - smmap==5.0.0
+      - spacy-alignments==0.9.0
+      - spacy-legacy==3.0.12
+      - spacy-loggers==1.0.4
+      - sqlalchemy==2.0.20
+      - srsly==2.4.7
+      - stevedore==5.1.0
+      - sympy==1.12
+      - tabulate==0.9.0
+      - thinc==8.1.12
+      - tokenizers==0.15.0
+      - tomli==2.0.1
+      - torch==2.0.0
+      - torchmetrics==1.1.1
+      - tqdm==4.66.1
+      - traitlets==5.9.0
+      - transformers==4.36.0
+      - triton==2.0.0
+      - typer==0.9.0
+      - typing-extensions==4.7.1
+      - tzdata==2023.3
+      - urllib3==2.0.4
+      - urwid==2.1.2
+      - urwid-readline==0.13
+      - virtualenv==20.24.4
+      - wandb==0.15.9
+      - wasabi==1.1.2
+      - wcwidth==0.2.6
+      - xxhash==3.3.0
+      - yarl==1.9.2
+      - zipp==3.16.2
+prefix: /home/arne/miniconda3/envs/pie-document-level

config.yaml ADDED Viewed

	@@ -0,0 +1,837 @@

+wandb_version: 1
+_wandb:
+  desc: null
+  value:
+    python_version: 3.9.17
+    cli_version: 0.15.9
+    framework: huggingface
+    huggingface_version: 4.36.0
+    is_jupyter_run: false
+    is_kaggle_kernel: false
+    start_time: 1709313942.075548
+    t:
+      1:
+      - 1
+      - 9
+      - 11
+      - 49
+      - 50
+      - 51
+      - 55
+      - 71
+      - 103
+      2:
+      - 1
+      - 9
+      - 11
+      - 49
+      - 50
+      - 51
+      - 55
+      - 71
+      - 103
+      3:
+      - 2
+      - 7
+      - 15
+      - 23
+      4: 3.9.17
+      5: 0.15.9
+      6: 4.36.0
+      8:
+      - 5
+    m:
+    - 1: trainer/global_step
+      6:
+      - 3
+    - 1: loss/train_step
+      5: 1
+      6:
+      - 1
+    - 1: epoch
+      5: 1
+      6:
+      - 1
+    - 1: loss/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/exact_encoding_matches/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/all/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/f1/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/recall/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/precision/val
+      5: 1
+      6:
+      - 1
+    - 1: loss/train_epoch
+      5: 1
+      6:
+      - 1
+    - 1: metric/exact_encoding_matches/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/label/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/index/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/len/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/order/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/correct/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/all/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/f1/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/recall/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/precision/train
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/correct/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/index/val
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/len/val
+      5: 1
+      6:
+      - 1
+    - 1: loss/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/exact_encoding_matches/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/correct/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/decoding_errors/all/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/micro/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/own_claim/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/background_claim/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/data/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/labeled_spans/macro/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/micro/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/parts_of_same/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/supports/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/contradicts/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/semantically_same/precision/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/f1/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/recall/test
+      5: 1
+      6:
+      - 1
+    - 1: metric/binary_relations/macro/precision/test
+      5: 1
+      6:
+      - 1
+_num_params/total:
+  desc: null
+  value: 141788928
+_num_params/trainable:
+  desc: null
+  value: 141788928
+_num_params/non_trainable:
+  desc: null
+  value: 0
+_config:
+  desc: null
+  value:
+    pipeline_type: training
+    name: dataset-sciarg/task-ner_re/v0.3
+    tags:
+    - task=ner_re
+    - model=pointer_network
+    train: true
+    validate: true
+    test: true
+    monitor_metric: metric/binary_relations/micro/f1/val
+    monitor_mode: max
+    seed: 1
+    ckpt_path: null
+    push_to_hub: false
+    model_save_dir: /home/arne/projects/pie-document-level/models/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-32
+    dataset:
+      _target_: src.utils.execute_pipeline
+      input:
+        _target_: pie_datasets.DatasetDict.load_dataset
+        path: pie/sciarg
+        revision: 982d5682ba414ee13cf92cb93ec18fc8e78e2b81
+      select_n:
+        _processor_: pie_datasets.DatasetDict.select
+        split: train
+        stop: null
+      select_n_test:
+        _processor_: pie_datasets.DatasetDict.select
+        split: test
+        stop: null
+      select_n_validation:
+        _processor_: pie_datasets.DatasetDict.select
+        split: validation
+        stop: null
+      create_test_split:
+        _processor_: pie_datasets.DatasetDict.move_to_new_split
+        source_split: train
+        target_split: test
+        ids:
+        - A32
+        - A33
+        - A34
+        - A35
+        - A36
+        - A37
+        - A38
+        - A39
+        - A40
+      create_validation_split:
+        _processor_: pie_datasets.DatasetDict.add_test_split
+        test_size: 0.1
+        seed: 1
+        source_split: train
+        target_split: validation
+    datamodule:
+      _target_: src.datamodules.PieDataModule
+      batch_size: 2
+      num_workers: 0
+      pin_memory: false
+      show_progress_for_encode: true
+      train_split: train
+      val_split: validation
+      test_split: test
+    taskmodule:
+      _target_: pie_modules.taskmodules.PointerNetworkTaskModuleForEnd2EndRE
+      tokenizer_init_kwargs:
+        add_prefix_space: true
+      tokenizer_name_or_path: facebook/bart-base
+      tokenizer_kwargs:
+        truncation: true
+        return_overflowing_tokens: true
+        stride: 128
+        strict_span_conversion: false
+      create_constraints: true
+      constrained_generation: true
+      partition_layer_name: labeled_partitions
+    model:
+      _target_: pie_modules.models.SimpleGenerativeModel
+      base_model_type: pie_modules.models.base_models.BartAsPointerNetwork
+      base_model_config:
+        pretrained_model_name_or_path: facebook/bart-base
+        use_encoder_mlp: true
+        use_constraints_encoder_mlp: true
+        decoder_position_id_pattern:
+        - 0
+        - 0
+        - 1
+        - 0
+        - 0
+        - 1
+        - 1
+        encoder_layer_norm_decay: 0.005
+        lr: 6.0e-05
+        num_beams: 4
+        max_length: 768
+        decoder_layer_norm_decay: 0.05
+      metric_stages:
+      - val
+      - test
+      - train
+      metric_call_predict:
+      - val
+      - test
+      warmup_proportion: 0.01
+    callbacks:
+      model_checkpoint:
+        _target_: pytorch_lightning.callbacks.ModelCheckpoint
+        dirpath: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints
+        filename: epoch_{epoch:03d}
+        monitor: metric/binary_relations/micro/f1/val
+        verbose: false
+        save_last: true
+        save_top_k: 1
+        mode: max
+        auto_insert_metric_name: false
+        save_weights_only: false
+        every_n_train_steps: null
+        train_time_interval: null
+        every_n_epochs: null
+        save_on_train_epoch_end: null
+      early_stopping:
+        _target_: pytorch_lightning.callbacks.EarlyStopping
+        monitor: metric/binary_relations/micro/f1/val
+        min_delta: 0.0
+        patience: 100
+        verbose: false
+        mode: max
+        strict: true
+        check_finite: true
+        stopping_threshold: null
+        divergence_threshold: null
+        check_on_train_epoch_end: null
+      model_summary:
+        _target_: pytorch_lightning.callbacks.RichModelSummary
+        max_depth: -1
+      rich_progress_bar:
+        _target_: pytorch_lightning.callbacks.RichProgressBar
+    logger:
+      wandb:
+        _target_: pytorch_lightning.loggers.wandb.WandbLogger
+        save_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
+        offline: false
+        id: null
+        anonymous: null
+        project: dataset-sciarg-task-ner_re-v0.3-training
+        log_model: false
+        prefix: ''
+        group: ''
+        tags:
+        - task=ner_re
+        - model=pointer_network
+        job_type: ''
+    trainer:
+      _target_: pytorch_lightning.Trainer
+      default_root_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
+      min_epochs: 150
+      max_epochs: 150
+      accelerator: gpu
+      devices: 1
+      check_val_every_n_epoch: 1
+      deterministic: false
+      gradient_clip_val: 5
+      gradient_clip_algorithm: value
+    paths:
+      root_dir: /home/arne/projects/pie-document-level
+      data_dir: /home/arne/projects/pie-document-level/data/
+      log_dir: /home/arne/projects/pie-document-level/logs/
+      output_dir: /home/arne/projects/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0
+      save_dir: /home/arne/projects/pie-document-level
+      work_dir: /home/arne/projects/pie-document-level
+    extras:
+      ignore_warnings: false
+      enforce_tags: true
+      print_config: true
+    base_model: facebook/bart-base
+base_model_type:
+  desc: null
+  value: pie_modules.models.base_models.BartAsPointerNetwork
+base_model_config:
+  desc: null
+  value:
+    pretrained_model_name_or_path: facebook/bart-base
+    use_encoder_mlp: true
+    use_constraints_encoder_mlp: true
+    decoder_position_id_pattern:
+    - 0
+    - 0
+    - 1
+    - 0
+    - 0
+    - 1
+    - 1
+    encoder_layer_norm_decay: 0.005
+    lr: 6.0e-05
+    num_beams: 4
+    max_length: 768
+    decoder_layer_norm_decay: 0.05
+    bos_token_id: 0
+    eos_token_id: 1
+    pad_token_id: 1
+    target_token_ids:
+    - 0
+    - 2
+    - 50267
+    - 50265
+    - 50268
+    - 50270
+    - 50271
+    - 50269
+    - 50272
+    - 50266
+    embedding_weight_mapping:
+      '50267':
+      - 4146
+      '50265':
+      - 3618
+      - 1215
+      - 31628
+      '50268':
+      - 414
+      '50270':
+      - 308
+      - 1215
+      - 31628
+      '50271':
+      - 37820
+      '50269':
+      - 1667
+      - 1215
+      - 1116
+      - 1215
+      - 41690
+      '50272':
+      - 9031
+      - 38600
+      - 1215
+      - 41690
+      '50266':
+      - 4548
+override_generation_kwargs:
+  desc: null
+  value: null
+warmup_proportion:
+  desc: null
+  value: 0.01
+learning_rate:
+  desc: null
+  value: null
+optimizer_type:
+  desc: null
+  value: null
+metric_stages:
+  desc: null
+  value:
+  - val
+  - test
+  - train
+metric_call_predict:
+  desc: null
+  value:
+  - val
+  - test
+taskmodule_config:
+  desc: null
+  value:
+    taskmodule_type: PointerNetworkTaskModuleForEnd2EndRE
+    tokenizer_name_or_path: facebook/bart-base
+    document_type: pytorch_ie.documents.TextDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
+    tokenized_document_type: pie_modules.documents.TokenDocumentWithLabeledSpansBinaryRelationsAndLabeledPartitions
+    span_layer_name: labeled_spans
+    relation_layer_name: binary_relations
+    none_label: none
+    loop_dummy_relation_name: loop
+    constrained_generation: true
+    label_tokens: null
+    label_representations: null
+    labels_per_layer:
+      labeled_spans:
+      - background_claim
+      - data
+      - own_claim
+      binary_relations:
+      - contradicts
+      - parts_of_same
+      - semantically_same
+      - supports
+    exclude_labels_per_layer: null
+    create_constraints: true
+    tokenizer_init_kwargs:
+      add_prefix_space: true
+    tokenizer_kwargs:
+      truncation: true
+      return_overflowing_tokens: true
+      stride: 128
+      strict_span_conversion: false
+    partition_layer_name: labeled_partitions
+    annotation_field_mapping: null
+    log_first_n_examples: null
+_best_checkpoint:
+  desc: null
+  value: epoch_145.ckpt
+_checkpoint_dir:
+  desc: null
+  value: /mnt/data/experiments/pie-document-level/logs/training/multiruns/dataset-sciarg/task-ner_re/v0.3/2024-03-01_18-25-31/0/checkpoints

wandb-metadata.json ADDED Viewed

	@@ -0,0 +1,117 @@

+{
+    "os": "Linux-5.15.0-86-generic-x86_64-with-glibc2.35",
+    "python": "3.9.17",
+    "heartbeatAt": "2024-03-01T17:25:43.088987",
+    "startedAt": "2024-03-01T17:25:42.069556",
+    "docker": null,
+    "cuda": null,
+    "args": [
+        "experiment=generic_pointer_network_end2end_re",
+        "dataset=sciarg_prepared",
+        "+taskmodule.partition_layer_name=labeled_partitions",
+        "+taskmodule.tokenizer_kwargs.strict_span_conversion=false",
+        "+model.base_model_config.decoder_layer_norm_decay=0.05",
+        "trainer=gpu",
+        "test=true",
+        "name=dataset-sciarg/task-ner_re/v0.3",
+        "seed=1,12,123,1234,12345",
+        "++hydra.callbacks.save_job_return.integrate_multirun_result=true",
+        "--multirun"
+    ],
+    "state": "running",
+    "program": "/home/arne/projects/pie-document-level/src/train.py",
+    "codePath": "src/train.py",
+    "git": {
+        "remote": "git@github.com:ArneBinder/pie-document-level.git",
+        "commit": "6deb3a264efba32f48f10addd87ccea04d4f8b5e"
+    },
+    "email": "arne.b.binder@gmail.com",
+    "root": "/home/arne/projects/pie-document-level",
+    "host": "arne-DFKI",
+    "username": "arne",
+    "executable": "/home/arne/miniconda3/envs/pie-document-level/bin/python",
+    "cpu_count": 6,
+    "cpu_count_logical": 12,
+    "cpu_freq": {
+        "current": 2199.99725,
+        "min": 2200.0,
+        "max": 3600.0
+    },
+    "cpu_freq_per_core": [
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2200.0,
+            "min": 2200.0,
+            "max": 3600.0
+        },
+        {
+            "current": 2199.967,
+            "min": 2200.0,
+            "max": 3600.0
+        }
+    ],
+    "disk": {
+        "total": 878.620922088623,
+        "used": 658.1419486999512
+    },
+    "gpu": "NVIDIA GeForce RTX 2080 Ti",
+    "gpu_count": 1,
+    "gpu_devices": [
+        {
+            "name": "NVIDIA GeForce RTX 2080 Ti",
+            "memory_total": 11811160064
+        }
+    ],
+    "memory": {
+        "total": 31.265464782714844
+    }
+}

wandb-summary.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"loss/train_step": 0.01761285401880741, "epoch": 150, "trainer/global_step": 39450, "_timestamp": 1709331727.5671468, "_runtime": 17785.49159884453, "_step": 1090, "loss/val": 2.5551652908325195, "metric/exact_encoding_matches/val": 0.3253012001514435, "metric/decoding_errors/all/val": 0.0, "metric/labeled_spans/micro/f1/val": 0.4795539081096649, "metric/labeled_spans/micro/recall/val": 0.4955185651779175, "metric/labeled_spans/micro/precision/val": 0.4645858407020569, "metric/labeled_spans/background_claim/f1/val": 0.5347467660903931, "metric/labeled_spans/background_claim/recall/val": 0.5159090757369995, "metric/labeled_spans/background_claim/precision/val": 0.5550122261047363, "metric/labeled_spans/data/f1/val": 0.5673912763595581, "metric/labeled_spans/data/recall/val": 0.5661605000495911, "metric/labeled_spans/data/precision/val": 0.5686274766921997, "metric/labeled_spans/own_claim/f1/val": 0.3920493423938751, "metric/labeled_spans/own_claim/recall/val": 0.4326777756214142, "metric/labeled_spans/own_claim/precision/val": 0.3583959937095642, "metric/labeled_spans/macro/f1/val": 0.49806246161460876, "metric/labeled_spans/macro/recall/val": 0.5049158334732056, "metric/labeled_spans/macro/precision/val": 0.49401187896728516, "metric/binary_relations/micro/f1/val": 0.2759901285171509, "metric/binary_relations/micro/recall/val": 0.2657926082611084, "metric/binary_relations/micro/precision/val": 0.28700128197669983, "metric/binary_relations/parts_of_same/f1/val": 0.2459016591310501, "metric/binary_relations/parts_of_same/recall/val": 0.23999999463558197, "metric/binary_relations/parts_of_same/precision/val": 0.2521008551120758, "metric/binary_relations/supports/f1/val": 0.2857142686843872, "metric/binary_relations/supports/recall/val": 0.27953410148620605, "metric/binary_relations/supports/precision/val": 0.29217392206192017, "metric/binary_relations/contradicts/f1/val": 0.26455026865005493, "metric/binary_relations/contradicts/recall/val": 0.23364485800266266, "metric/binary_relations/contradicts/precision/val": 0.3048780560493469, "metric/binary_relations/macro/f1/val": 0.19904154539108276, "metric/binary_relations/macro/recall/val": 0.18829473853111267, "metric/binary_relations/macro/precision/val": 0.21228821575641632, "metric/binary_relations/semantically_same/f1/val": 0.0, "metric/binary_relations/semantically_same/recall/val": 0.0, "metric/binary_relations/semantically_same/precision/val": 0.0, "loss/train_epoch": 0.06590206921100616, "metric/exact_encoding_matches/train": 0.9276190400123596, "metric/decoding_errors/label/train": 0.0002683123166207224, "metric/decoding_errors/index/train": 0.0, "metric/decoding_errors/len/train": 0.0001341561583103612, "metric/decoding_errors/order/train": 0.003353904001414776, "metric/decoding_errors/correct/train": 0.9962436556816101, "metric/decoding_errors/all/train": 0.0037563724908977747, "metric/labeled_spans/background_claim/f1/train": 0.9950291514396667, "metric/labeled_spans/background_claim/recall/train": 0.9943844676017761, "metric/labeled_spans/background_claim/precision/train": 0.995674729347229, "metric/labeled_spans/data/f1/train": 0.9951720833778381, "metric/labeled_spans/data/recall/train": 0.994088351726532, "metric/labeled_spans/data/precision/train": 0.9962581992149353, "metric/labeled_spans/own_claim/f1/train": 0.997970700263977, "metric/labeled_spans/own_claim/recall/train": 0.9975208640098572, "metric/labeled_spans/own_claim/precision/train": 0.9984209537506104, "metric/labeled_spans/micro/f1/train": 0.9963851571083069, "metric/labeled_spans/micro/recall/train": 0.995685338973999, "metric/labeled_spans/micro/precision/train": 0.9970859885215759, "metric/labeled_spans/macro/f1/train": 0.9960572719573975, "metric/labeled_spans/macro/recall/train": 0.9953312277793884, "metric/labeled_spans/macro/precision/train": 0.9967846274375916, "metric/binary_relations/supports/f1/train": 0.9916067123413086, "metric/binary_relations/supports/recall/train": 0.9889978766441345, "metric/binary_relations/supports/precision/train": 0.9942293763160706, "metric/binary_relations/micro/f1/train": 0.9924262166023254, "metric/binary_relations/micro/recall/train": 0.9898684620857239, "metric/binary_relations/micro/precision/train": 0.9949973225593567, "metric/binary_relations/parts_of_same/f1/train": 0.9962507486343384, "metric/binary_relations/parts_of_same/recall/train": 0.9935897588729858, "metric/binary_relations/parts_of_same/precision/train": 0.9989258646965027, "metric/binary_relations/contradicts/f1/train": 0.9927158951759338, "metric/binary_relations/contradicts/recall/train": 0.9916840195655823, "metric/binary_relations/contradicts/precision/train": 0.9937499761581421, "metric/binary_relations/semantically_same/f1/train": 0.9818181991577148, "metric/binary_relations/semantically_same/recall/train": 0.9642857313156128, "metric/binary_relations/semantically_same/precision/train": 1.0, "metric/binary_relations/macro/f1/train": 0.9905978441238403, "metric/binary_relations/macro/recall/train": 0.9846393465995789, "metric/binary_relations/macro/precision/train": 0.9967262744903564, "metric/decoding_errors/correct/val": 1.0, "metric/decoding_errors/index/val": 0.0, "metric/decoding_errors/len/val": 0.0, "loss/test": 2.615832805633545, "metric/exact_encoding_matches/test": 0.3636363744735718, "metric/decoding_errors/correct/test": 1.0, "metric/decoding_errors/all/test": 0.0, "metric/labeled_spans/micro/f1/test": 0.4372429847717285, "metric/labeled_spans/micro/recall/test": 0.4461228549480438, "metric/labeled_spans/micro/precision/test": 0.4287096858024597, "metric/labeled_spans/own_claim/f1/test": 0.3857002258300781, "metric/labeled_spans/own_claim/recall/test": 0.4384787380695343, "metric/labeled_spans/own_claim/precision/test": 0.3442623019218445, "metric/labeled_spans/background_claim/f1/test": 0.4095562994480133, "metric/labeled_spans/background_claim/recall/test": 0.34433284401893616, "metric/labeled_spans/background_claim/precision/test": 0.5052631497383118, "metric/labeled_spans/data/f1/test": 0.5392895340919495, "metric/labeled_spans/data/recall/test": 0.5324123501777649, "metric/labeled_spans/data/precision/test": 0.5463467836380005, "metric/labeled_spans/macro/f1/test": 0.4448487162590027, "metric/labeled_spans/macro/recall/test": 0.4384079873561859, "metric/labeled_spans/macro/precision/test": 0.46529075503349304, "metric/binary_relations/micro/f1/test": 0.21993334591388702, "metric/binary_relations/micro/recall/test": 0.20381808280944824, "metric/binary_relations/micro/precision/test": 0.2388157844543457, "metric/binary_relations/parts_of_same/f1/test": 0.19502867758274078, "metric/binary_relations/parts_of_same/recall/test": 0.1764705926179886, "metric/binary_relations/parts_of_same/precision/test": 0.21794871985912323, "metric/binary_relations/supports/f1/test": 0.22637012600898743, "metric/binary_relations/supports/recall/test": 0.21079881489276886, "metric/binary_relations/supports/precision/test": 0.24442538619041443, "metric/binary_relations/contradicts/f1/test": 0.2039215862751007, "metric/binary_relations/contradicts/recall/test": 0.18978102505207062, "metric/binary_relations/contradicts/precision/test": 0.22033898532390594, "metric/binary_relations/semantically_same/f1/test": 0.4000000059604645, "metric/binary_relations/semantically_same/recall/test": 0.3333333432674408, "metric/binary_relations/semantically_same/precision/test": 0.5, "metric/binary_relations/macro/f1/test": 0.25633010268211365, "metric/binary_relations/macro/recall/test": 0.2275959551334381, "metric/binary_relations/macro/precision/test": 0.2956782579421997, "_wandb": {"runtime": 17784}}