Skip to content

Commit

Permalink
Update model card for h2oai/h2ogpt-oig-oasst1-512-6.9b
Browse files (browse the repository at this point in the history)
  • Loading branch information
arnocandel committed Apr 23, 2023
1 parent 6f6ac27 commit fcaae7e
Show file tree
Hide file tree
Showing 2 changed files with 17 additions and 8 deletions.
4 changes: 2 additions & 2 deletions models/README-template.md
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ tags:
- large language model
- open-source
datasets:
- <<DATASET_NAME>>
<<DATASET_NAME>>
---
# h2oGPT Model Card
## Summary
Expand All @@ -21,7 +21,7 @@ H2O.ai's `<<MODEL_NAME>>` is a <<MODEL_SIZE>> billion parameter instruction-foll
- Base model: <<BASE_MODEL>>
- Fine-tuning dataset: <<DATASET>>
- Data-prep and fine-tuning code: [H2O.ai GitHub](https://github.com/h2oai/h2ogpt)
- Training logs: [zip](<<TRAINING_LOGS>>)
- Training logs: <<TRAINING_LOGS>>

## Chatbot

Expand Down
21 changes: 15 additions & 6 deletions models/create_model_cards.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,8 +37,14 @@
(
"h2ogpt-oig-oasst1-512-6.9b",
"EleutherAI/pythia-6.9b",
"h2oai/h2ogpt-oig-oasst1-instruct-cleaned-v1",
"https://huggingface.co/h2oai/h2ogpt-oig-oasst1-512-6.9b/blob/main/pythia-6.9b.h2ogpt-oig-oasst1-instruct-cleaned-v1.json.1_epochs.5fc91911bc2bfaaf3b6c2de577c4b0ae45a07a4a.7.zip",
[
"h2oai/h2ogpt-oig-oasst1-instruct-cleaned-v1",
"h2oai/openassistant_oasst1_h2ogpt",
],
[
"https://huggingface.co/h2oai/h2ogpt-oig-oasst1-512-6.9b/blob/main/pythia-6.9b.h2ogpt-oig-oasst1-instruct-cleaned-v1.json.1_epochs.5fc91911bc2bfaaf3b6c2de577c4b0ae45a07a4a.7.zip",
"https://huggingface.co/h2oai/h2ogpt-oig-oasst1-512-6.9b/blob/main/h2ogpt-oig-oasst1-512-6.9b.h2oaiopenassistant_oasst1_h2ogpt.2_epochs.e35e2e06e0af2f7dceac2e16e3646c90ccce4ec0.1.zip",
],
),
(
"h2ogpt-oig-oasst1-256-20b",
Expand Down Expand Up @@ -82,10 +88,11 @@ def test_create_model_cards(model_name, base_model, dataset, training_logs):
content = content.replace("<<BASE_MODEL>>", f"[{base_model}](https://huggingface.co/{base_model})")

assert "<<DATASET>>" in content
content = content.replace("<<DATASET>>", f"[{dataset}](https://huggingface.co/datasets/{dataset})")

assert "<<DATASET_NAME>>" in content
content = content.replace("<<DATASET_NAME>>", dataset)
if not isinstance(dataset, list):
dataset = [dataset]
content = content.replace("<<DATASET>>", " and ".join([f"[{d}](https://huggingface.co/datasets/{d})" for d in dataset]))
content = content.replace("<<DATASET_NAME>>", "\n".join([f"- {d}" for d in dataset]))

assert "<<MODEL_ARCH>>" in content
content = content.replace("<<MODEL_ARCH>>", model_arch)
Expand All @@ -94,7 +101,9 @@ def test_create_model_cards(model_name, base_model, dataset, training_logs):
content = content.replace("<<MODEL_CONFIG>>", model_config)

assert "<<TRAINING_LOGS>>" in content
content = content.replace("<<TRAINING_LOGS>>", training_logs)
if not isinstance(training_logs, list):
training_logs = [training_logs]
content = content.replace("<<TRAINING_LOGS>>", " and ".join(f"[zip]({t})" for t in training_logs))

assert "<<" not in content
assert ">>" not in content
Expand Down

0 comments on commit fcaae7e

Please sign in to comment.