johnometalman committed on
Commit
8ce1706
·
1 Parent(s): 81dcf19

exploration of datasets

Browse files
.gitignore CHANGED
@@ -1,2 +1,2 @@
1
  venv/
2
- dataset.py
 
1
  venv/
2
+ notebook.ipynb
app.py CHANGED
@@ -1,26 +1,29 @@
1
  import streamlit as st
2
  import pandas as pd
3
- import kagglehub
4
- import zipfile
5
- import os
6
 
7
  st.title('Dashboard de Venture Capital')
8
  st.markdown('Demo portafolio de Machine Learning y Venture Capital')
9
 
10
- # Download latest version
11
- path = kagglehub.dataset_download("sashakorovkina/4808-techstars-backed-companies-in-2024", path="./datasets/")
 
 
 
12
 
13
- # # Unzip the dataset (if compressed)
14
- # with zipfile.ZipFile(path, 'r') as zip_ref:
15
- # zip_ref.extractall("./datasets")
16
 
17
- # Load CSV into a DataFrame
18
- csv_path = "./datasets/sashakorovkina/4808-techstars-backed-companies-in-2024.csv"
19
- df = pd.read_csv(csv_path)
20
 
21
- # Display DataFrame in Streamlit
22
- st.write(df.head())
 
 
23
 
 
 
24
 
25
- # Sidebar and Filter
26
- st.sidebar.write("Opciones para Filtro")
 
1
  import streamlit as st
2
  import pandas as pd
3
+
 
 
4
 
5
  st.title('Dashboard de Venture Capital')
6
  st.markdown('Demo portafolio de Machine Learning y Venture Capital')
7
 
8
+ # Load CSV into a DataFrame
9
+ data = "./datasets/companies.csv"
10
+ data = pd.read_csv(data)
11
+
12
+ df = pd.DataFrame(data)
13
 
14
+ # Get the column names for segmented control (e.g., 'Status' column)
15
+ filters = df.columns.tolist() # This will give a list of column names in the dataframe
 
16
 
17
+ # Add the segmented control widget to let the user choose a filter
18
+ selected_filter = st.sidebar.segmented_control("Select a column to filter", filters)
 
19
 
20
+ # Based on the selected filter, display options for filtering
21
+ if selected_filter:
22
+ unique_values = df[selected_filter].unique().tolist()
23
+ selected_value = st.sidebar.selectbox(f"Select value to filter by {selected_filter}", unique_values)
24
 
25
+ # Filter the dataframe based on the selected value
26
+ filtered_df = df[df[selected_filter] == selected_value]
27
 
28
+ # Display the filtered dataframe
29
+ st.write(filtered_df)
datasets/companies.csv ADDED
The diff for this file is too large to render. See raw diff
 
datasets/industries.csv ADDED
The diff for this file is too large to render. See raw diff
 
datasets/program_names.csv ADDED
The diff for this file is too large to render. See raw diff
 
requirements.txt CHANGED
@@ -1,2 +1 @@
1
- streamlit
2
- kagglehub
 
1
+ streamlit