-
-
Notifications
You must be signed in to change notification settings - Fork 12
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
3,726 changed files
with
238,117 additions
and
0 deletions.
The diff you're trying to view is too large. We only load the first 3000 changed files.
There are no files selected for viewing
9 changes: 9 additions & 0 deletions
9
experiments/fanoutqa/cohere-hf/baseline/00065f204bddb94d/events.jsonl
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
{"type":"kani_spawn","timestamp":1731993444.7135954,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","depth":0,"parent":null,"children":[],"always_included_messages":[],"chat_history":[],"state":"stopped","name":"root","engine_type":"CommandRVLLMEngine","engine_repr":"CommandRVLLMEngine(model=<vllm.engine.async_llm_engine.AsyncLLMEngine object at 0x7fd714657ed0>, tokenizer=CachedCohereTokenizerFast(name_or_path='CohereForAI/c4ai-command-r-plus-08-2024', vocab_size=255000, model_max_length=1000000000000000019884624838656, is_fast=True, padding_side='left', truncation_side='left', special_tokens={'bos_token': '<BOS_TOKEN>', 'eos_token': '<|END_OF_TURN_TOKEN|>', 'pad_token': '<PAD>'}, clean_up_tokenization_spaces=False), added_tokens_decoder={\n\t0: AddedToken(\"<PAD>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t1: AddedToken(\"<UNK>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t2: AddedToken(\"<CLS>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t3: AddedToken(\"<SEP>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t4: AddedToken(\"<MASK_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t5: AddedToken(\"<BOS_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t6: AddedToken(\"<EOS_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t7: AddedToken(\"<EOP_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t255000: AddedToken(\"<|START_OF_TURN_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255001: AddedToken(\"<|END_OF_TURN_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t255002: AddedToken(\"<|YES_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255003: AddedToken(\"<|NO_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255004: AddedToken(\"<|GOOD_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255005: AddedToken(\"<|BAD_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255006: AddedToken(\"<|USER_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255007: AddedToken(\"<|CHATBOT_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255008: AddedToken(\"<|SYSTEM_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255009: AddedToken(\"<|USER_0_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255010: AddedToken(\"<|USER_1_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255011: AddedToken(\"<|USER_2_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255012: AddedToken(\"<|USER_3_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255013: AddedToken(\"<|USER_4_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255014: AddedToken(\"<|USER_5_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255015: AddedToken(\"<|USER_6_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255016: AddedToken(\"<|USER_7_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255017: AddedToken(\"<|USER_8_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255018: AddedToken(\"<|USER_9_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255019: AddedToken(\"<|EXTRA_0_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255020: AddedToken(\"<|EXTRA_1_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255021: AddedToken(\"<|EXTRA_2_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255022: AddedToken(\"<|EXTRA_3_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255023: AddedToken(\"<|EXTRA_4_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255024: AddedToken(\"<|EXTRA_5_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255025: AddedToken(\"<|EXTRA_6_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255026: AddedToken(\"<|EXTRA_7_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255027: AddedToken(\"<|EXTRA_8_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255028: AddedToken(\"<|EXTRA_9_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n}, max_context_size=128000, hyperparams={'sampling_params': SamplingParams(n=1, presence_penalty=0.0, frequency_penalty=0.0, repetition_penalty=1.0, temperature=0.7, top_p=1.0, top_k=-1, min_p=0.0, seed=None, stop=[], stop_token_ids=[], bad_words=[], include_stop_str_in_output=False, ignore_eos=False, max_tokens=2048, min_tokens=1, logprobs=None, prompt_logprobs=None, skip_special_tokens=True, spaces_between_special_tokens=True, truncate_prompt_tokens=None, guided_decoding=None)}, pipeline=ChatTemplatePromptPipeline([]))","functions":[{"name":"search","desc":"Search Wikipedia for an article with the given title, and get its content. If no such article is found, return similar article names.","auto_retry":true,"auto_truncate":null,"after":"assistant","json_schema":{"properties":{"query":{"type":"string"}},"required":["query"],"type":"object"}}]} | ||
{"type":"kani_state_change","timestamp":1731993444.7137208,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","state":"running"} | ||
{"type":"kani_message","timestamp":1731993444.7137537,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","msg":{"role":"user","content":"What are the years of birth of the authors of the top 5 best-selling books?","name":null,"tool_call_id":null,"tool_calls":null,"is_tool_call_error":null}} | ||
{"type":"root_message","timestamp":1731993444.7137609,"msg":{"role":"user","content":"What are the years of birth of the authors of the top 5 best-selling books?","name":null,"tool_call_id":null,"tool_calls":null,"is_tool_call_error":null}} | ||
{"type":"kani_message","timestamp":1731993453.6062393,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","msg":{"role":"assistant","content":"Not all the authors of the top five best-selling books are known, but here are the birth years of the known authors:\n\n* *The Little Prince* by Antoine de Saint-Exupéry, born in 1900\n* *The Lord of the Rings* by J.R.R. Tolkien, born in 1892\n* *The Hobbit* by J.R.R. Tolkien, born in 1892","name":null,"tool_call_id":null,"tool_calls":null,"is_tool_call_error":null}} | ||
{"type":"root_message","timestamp":1731993453.6062539,"msg":{"role":"assistant","content":"Not all the authors of the top five best-selling books are known, but here are the birth years of the known authors:\n\n* *The Little Prince* by Antoine de Saint-Exupéry, born in 1900\n* *The Lord of the Rings* by J.R.R. Tolkien, born in 1892\n* *The Hobbit* by J.R.R. Tolkien, born in 1892","name":null,"tool_call_id":null,"tool_calls":null,"is_tool_call_error":null}} | ||
{"type":"tokens_used","timestamp":1731993453.6062624,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","prompt_tokens":852,"completion_tokens":129} | ||
{"type":"kani_state_change","timestamp":1731993453.6062832,"id":"7afacc4d-df0c-434e-bb67-d6b1cdf674d8","state":"stopped"} | ||
{"type":"round_complete","timestamp":1731993453.6062942,"session_id":"1731993444-12dcf2e1-955c-422d-b85d-2ca45b1f5dc1"} |
57 changes: 57 additions & 0 deletions
57
experiments/fanoutqa/cohere-hf/baseline/00065f204bddb94d/state.json
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,57 @@ | ||
{ | ||
"id": "1731993444-12dcf2e1-955c-422d-b85d-2ca45b1f5dc1", | ||
"title": "fanoutqa: What are the years of birth of the authors of the top 5 best-selling books? (00065f204bddb94d)", | ||
"last_modified": 1731993453.6740694, | ||
"n_events": 9, | ||
"state": [ | ||
{ | ||
"id": "7afacc4d-df0c-434e-bb67-d6b1cdf674d8", | ||
"depth": 0, | ||
"parent": null, | ||
"children": [], | ||
"always_included_messages": [], | ||
"chat_history": [ | ||
{ | ||
"role": "user", | ||
"content": "What are the years of birth of the authors of the top 5 best-selling books?", | ||
"name": null, | ||
"tool_call_id": null, | ||
"tool_calls": null, | ||
"is_tool_call_error": null | ||
}, | ||
{ | ||
"role": "assistant", | ||
"content": "Not all the authors of the top five best-selling books are known, but here are the birth years of the known authors:\n\n* *The Little Prince* by Antoine de Saint-Exup\u00e9ry, born in 1900\n* *The Lord of the Rings* by J.R.R. Tolkien, born in 1892\n* *The Hobbit* by J.R.R. Tolkien, born in 1892", | ||
"name": null, | ||
"tool_call_id": null, | ||
"tool_calls": null, | ||
"is_tool_call_error": null | ||
} | ||
], | ||
"state": "stopped", | ||
"name": "root", | ||
"engine_type": "CommandRVLLMEngine", | ||
"engine_repr": "CommandRVLLMEngine(model=<vllm.engine.async_llm_engine.AsyncLLMEngine object at 0x7fd714657ed0>, tokenizer=CachedCohereTokenizerFast(name_or_path='CohereForAI/c4ai-command-r-plus-08-2024', vocab_size=255000, model_max_length=1000000000000000019884624838656, is_fast=True, padding_side='left', truncation_side='left', special_tokens={'bos_token': '<BOS_TOKEN>', 'eos_token': '<|END_OF_TURN_TOKEN|>', 'pad_token': '<PAD>'}, clean_up_tokenization_spaces=False), added_tokens_decoder={\n\t0: AddedToken(\"<PAD>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t1: AddedToken(\"<UNK>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t2: AddedToken(\"<CLS>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t3: AddedToken(\"<SEP>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t4: AddedToken(\"<MASK_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t5: AddedToken(\"<BOS_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t6: AddedToken(\"<EOS_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t7: AddedToken(\"<EOP_TOKEN>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t255000: AddedToken(\"<|START_OF_TURN_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255001: AddedToken(\"<|END_OF_TURN_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),\n\t255002: AddedToken(\"<|YES_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255003: AddedToken(\"<|NO_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255004: AddedToken(\"<|GOOD_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255005: AddedToken(\"<|BAD_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255006: AddedToken(\"<|USER_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255007: AddedToken(\"<|CHATBOT_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255008: AddedToken(\"<|SYSTEM_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255009: AddedToken(\"<|USER_0_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255010: AddedToken(\"<|USER_1_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255011: AddedToken(\"<|USER_2_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255012: AddedToken(\"<|USER_3_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255013: AddedToken(\"<|USER_4_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255014: AddedToken(\"<|USER_5_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255015: AddedToken(\"<|USER_6_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255016: AddedToken(\"<|USER_7_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255017: AddedToken(\"<|USER_8_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255018: AddedToken(\"<|USER_9_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255019: AddedToken(\"<|EXTRA_0_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255020: AddedToken(\"<|EXTRA_1_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255021: AddedToken(\"<|EXTRA_2_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255022: AddedToken(\"<|EXTRA_3_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255023: AddedToken(\"<|EXTRA_4_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255024: AddedToken(\"<|EXTRA_5_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255025: AddedToken(\"<|EXTRA_6_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255026: AddedToken(\"<|EXTRA_7_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255027: AddedToken(\"<|EXTRA_8_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n\t255028: AddedToken(\"<|EXTRA_9_TOKEN|>\", rstrip=False, lstrip=False, single_word=False, normalized=False, special=False),\n}, max_context_size=128000, hyperparams={'sampling_params': SamplingParams(n=1, presence_penalty=0.0, frequency_penalty=0.0, repetition_penalty=1.0, temperature=0.7, top_p=1.0, top_k=-1, min_p=0.0, seed=None, stop=[], stop_token_ids=[], bad_words=[], include_stop_str_in_output=False, ignore_eos=False, max_tokens=2048, min_tokens=1, logprobs=None, prompt_logprobs=None, skip_special_tokens=True, spaces_between_special_tokens=True, truncate_prompt_tokens=None, guided_decoding=None)}, pipeline=ChatTemplatePromptPipeline([]))", | ||
"functions": [ | ||
{ | ||
"name": "search", | ||
"desc": "Search Wikipedia for an article with the given title, and get its content. If no such article is found, return similar article names.", | ||
"auto_retry": true, | ||
"auto_truncate": null, | ||
"after": "assistant", | ||
"json_schema": { | ||
"properties": { | ||
"query": { | ||
"type": "string" | ||
} | ||
}, | ||
"required": [ | ||
"query" | ||
], | ||
"type": "object" | ||
} | ||
} | ||
] | ||
} | ||
] | ||
} |
Oops, something went wrong.