Skip to content

Instantly share code, notes, and snippets.

@relyt0925
Created August 18, 2024 19:14
Show Gist options
  • Save relyt0925/fe77c510acaadfac440c0d9c71116eed to your computer and use it in GitHub Desktop.
Save relyt0925/fe77c510acaadfac440c0d9c71116eed to your computer and use it in GitHub Desktop.
skills recipe
[root@tyler-a100 instructlab]# cat /var/mnt/inststg1/instructlab/generated/skills_recipe_2024-08-17T15_42_00.yaml
datasets:
- path: /usr/share/instructlab/sdg/datasets/skills.jsonl
  sampling_size: 1.0
- path: node_datasets_2024-08-17T15_42_00/knowledge_compliance_personally-identifiable-information_p10.jsonl
  sampling_size: 1.0
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_general_tables_editing_add_remove.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_general_tables_editing_combining_altering.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_general_tables_empty.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_abstractive_title.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_abstractive_abstract.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_abstractive_outline.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_abstractive_main_takeaway.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_abstractive_key_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_services_agreement_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_services_agreement_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_services_agreement_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_inference_qualitative_sentiment.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_inference_quantitative_asciidoc_tables.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_inference_quantitative_table_analaysis.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_invoice_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_invoice_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_invoice_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_invoice_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_invoice_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_information_named_entities_person_names.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_information_named_entities_places.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_information_named_entities_dates_and_events.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_receipt_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_receipt_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_receipt_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_receipt_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_receipt_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_commercial_lease_agreement_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_commercial_lease_agreement_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_commercial_lease_agreement_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_commercial_lease_agreement_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_commercial_lease_agreement_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_equations_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_equations_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_equations_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_equations_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_equations_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_tables_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_tables_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_tables_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_tables_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_abstract_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_abstract_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_abstract_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_abstract_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_technical_paper_abstract_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_annual_report_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_annual_report_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_annual_report_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_annual_report_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_fda_filing_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_fda_filing_markdown.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_fda_filing_csv.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_fda_filing_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_fda_filing_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_email_bullet_points.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_email_plain_text.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_extraction_email_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_abstract.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_non_fictional_historical_figures.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_non_fictional_popular_personalities.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_fictional_tv_shows.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_fictional_movies.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_you_are_fictional_video_games.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_i_am_primary_schooler.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_roleplay_explain_like_i_am_graduate.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_jumbled_sentences.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_pattern_recognition.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_complete_common_expressions.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_summarization_ignore_pii.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_summarization_list_of_sentences.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_organize_lists.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_word_gen.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_rhyming_words.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_reversing_string.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_linguistics_classification_agent_classification.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_science_geography.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_science_units_conversion_temperature_conversion.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_science_units_conversion_distance_conversion.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_pattern_recognition.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_area.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_mensurational.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_arithmetic_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_time_series.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_distance_conversion.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_arithmetic_w_grammar.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_STEM_math_reasoning.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_summarization_wiki_insights_concise.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_summarization_wiki_insights_five_point.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_summarization_wiki_insights_detailed.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_summarization_wiki_insights_high_level_outline.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_summarization_wiki_insights_one_line.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_meeting_insights_executive_summaries.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_meeting_insights_corporate_email.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_meeting_insights_minutes_of_meeting.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_meeting_insights_action_items.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_editing_grammar.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_editing_spelling.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_grounded_editing_punctuation.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_poetry_sonnet.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_poetry_haiku.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_poetry_limerick.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_social_media_linkedin.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_social_media_twitter.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_social_media_facebook.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_legal_contracts.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_legal_agreement.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_jokes_puns_general.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_riddles.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_brainstorming_refute_claim.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_brainstorming_support_claim.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_brainstorming_idea_generation.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_grammar_basic_grammer_tests.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_debate.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_emoji.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_prose_emails_formal.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_prose_emails_informal.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_prose_articles.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_prose_screenplay.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_product_description.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_user_manual.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_proposal.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_guide.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_report.jsonl
  sampling_size: 30
- path: node_datasets_2024-08-17T15_42_00/compositional_skills_writing_freeform_technical_specification.jsonl
  sampling_size: 30
metadata:
  sys_prompt: "I am, Red Hat\xAE Instruct Model based on Granite 7B, an AI language\
    \ model developed by Red Hat and IBM Research, based on the Granite-7b-base language\
    \ model. My primary function is to be a chat assistant."
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment