# NOTE(review): the file-viewer residue that preceded this document (status
# text, commit hashes, line-number gutter) is not part of the configuration.
---
# Retriever settings.
# NOTE(review): nesting reconstructed from key names after indentation was
# lost — confirm against the consumer's schema.
retriever:
  # Maps a retriever name to a path; presumably a Hugging Face repo id
  # (inferred from the key name) — verify against the loader.
  retriever_hf_paths:
    RAGatouille: "XThomasBU/Colbert_Index"
# Course-content metadata settings.
# NOTE(review): indentation was lost in this file; every key below is assumed
# to be a child of `metadata` — confirm against the consumer's schema.
metadata:
  metadata_links:
    - "https://dl4ds.github.io/sp2025/"
    - "https://dl4ds.github.io/sp2025/schedule/"
  slide_base_link: "https://dl4ds.github.io"
  # Assignment base link is used to find the webpage where the assignment is
  # described/posted.
  # NOTE(review): this points at a different site and term (tools4ds, fa2024)
  # than the links above (dl4ds, sp2025) — confirm this is intentional.
  assignment_base_link: "https://tools4ds.github.io/fa2024/assignments/"
  # Define content types - assignments, lectures, etc.
  content_types:
    - "lectures"
    - "assignments"
    - "discussion"
    - "other"
  # These need to be patterns from URLs that can be used to identify the type
  # of content uniquely.
  # NOTE(review): `project_pattern` has no matching entry in `content_types`
  # (which lists "other" instead) — verify how the consumer pairs them.
  lectures_pattern: "/lectures/"
  assignments_pattern: "/assignments/"
  discussion_pattern: "/discussion/"
  project_pattern: "/project/"
  # These are fields that can be extracted from the webpages of the course
  # content.
  lecture_metadata_fields:
    - "title"
    - "tldr"
    - "date"
    - "lecture_recording"
    - "suggested_readings"
  assignment_metadata_fields:
    - "title"
    - "release_date"
    - "due_date"
    - "source_file"
# Token allowance settings.
# NOTE(review): units are not stated in this file; the two *_time values are
# presumably seconds — confirm against the consumer.
token_config:
  cooldown_time: 60
  regen_time: 180
  tokens_left: 50000
  all_time_tokens_allocated: 1000000
# Content-splitting settings.
content:
  # Each entry is a [header marker, label] pair.
  # NOTE(review): entry order ("##" before "#") is kept as-is in case the
  # consumer depends on it.
  notebookheaders_to_split_on:
    - ["##", "Section"]
    - ["#", "Title"]
# Miscellaneous project links.
misc:
  github_repo: "https://github.com/edubotics-ai/edubot-core"
  docs_website: "https://dl4ds.github.io/dl4ds_tutor/"
# API client settings.
api_config:
  # NOTE(review): unit not stated here; presumably seconds — confirm.
  timeout: 60
# NOTE(review): a stray "|" left by the file viewer's table markup was here.