# sp25_tutor/apps/ai_tutor/config/project_config.yml
# Farid Karimli
# Retarget to Spring 25
# 527151b
# Retriever settings.
retriever:
  # Index locations keyed by retriever name. The value looks like a
  # Hugging Face Hub repo id ("owner/name") -- confirm against the loader.
  retriever_hf_paths:
    RAGatouille: "XThomasBU/Colbert_Index"
# Where the course content lives and how its pages are classified and parsed.
metadata:
  # Course pages listed as metadata sources.
  metadata_links:
    - "https://dl4ds.github.io/sp2025/"
    - "https://dl4ds.github.io/sp2025/schedule/"
  slide_base_link: "https://dl4ds.github.io"
  # Base link used to find the webpage where an assignment is
  # described/posted.
  # NOTE(review): this still targets tools4ds fa2024 while metadata_links
  # target dl4ds sp2025 -- confirm whether it should be retargeted as well.
  assignment_base_link: "https://tools4ds.github.io/fa2024/assignments/"
  # Content types: assignments, lectures, etc.
  # NOTE(review): "other" has no matching *_pattern key below, and
  # project_pattern has no matching entry here -- confirm this is intended.
  content_types:
    - "lectures"
    - "assignments"
    - "discussion"
    - "other"
  # URL patterns; each must identify its type of content uniquely.
  lectures_pattern: "/lectures/"
  assignments_pattern: "/assignments/"
  discussion_pattern: "/discussion/"
  project_pattern: "/project/"
  # Fields that can be extracted from the course content webpages.
  lecture_metadata_fields:
    - "title"
    - "tldr"
    - "date"
    - "lecture_recording"
    - "suggested_readings"
  assignment_metadata_fields:
    - "title"
    - "release_date"
    - "due_date"
    - "source_file"
# Token budget settings.
# NOTE(review): units and exact semantics are not visible in this file;
# the *_time values are presumably seconds -- confirm against the consumer.
token_config:
  cooldown_time: 60
  regen_time: 180
  tokens_left: 50000
  all_time_tokens_allocated: 1000000
# Content-splitting settings.
content:
  # Each entry is a two-item list: a Markdown heading marker followed by a
  # label ("##" with "Section", "#" with "Title").
  # Presumably consumed by a header-based splitter for notebooks -- confirm.
  notebookheaders_to_split_on:
    - ["##", "Section"]
    - ["#", "Title"]
# Miscellaneous project links.
misc:
  # Source repository URL.
  github_repo: "https://github.com/edubotics-ai/edubot-core"
  # Documentation site URL.
  docs_website: "https://dl4ds.github.io/dl4ds_tutor/"
# API client settings.
api_config:
  # NOTE(review): unit is not stated here; presumably seconds -- confirm.
  timeout: 60