-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathutils.py
31 lines (22 loc) · 1.07 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Streamlit helpers for summarising Snowpark DataFrames.
import snowflake.snowpark as snowpark
import streamlit as st
# import snowflake.snowpark.functions as F
import snowflake.snowpark.types as T
def describeSnowparkDF(snowpark_df: snowpark.DataFrame) -> None:
    """Render a summary of a Snowpark DataFrame in the Streamlit app.

    Writes, in order: an intro line, the list of schema fields, the names
    of the numeric and categorical columns side by side, and the result of
    ``snowpark_df.describe()`` sorted on its ``SUMMARY`` column.

    Args:
        snowpark_df: The Snowpark DataFrame to summarise.
    """
    st.write("Here's some stats about the loaded data:")

    # Tuples so they can be passed straight to isinstance(). The numeric
    # set covers every integral and fractional type in snowpark.types,
    # so Byte/Short columns are no longer silently left out.
    numeric_types = (
        T.ByteType,
        T.ShortType,
        T.IntegerType,
        T.LongType,
        T.FloatType,
        T.DoubleType,
        T.DecimalType,
    )
    categorical_types = (T.StringType,)

    # Look the schema up once and reuse it for every listing below.
    fields = snowpark_df.schema.fields

    # Numeric columns
    numeric_columns = [
        field.name for field in fields
        if isinstance(field.datatype, numeric_types)
    ]
    # Categorical columns
    categorical_columns = [
        field.name for field in fields
        if isinstance(field.datatype, categorical_types)
    ]

    st.write("Relational schema:")
    st.write(list(fields))

    col1, col2 = st.columns(2)
    with col1:
        st.write('Numeric columns:\t', numeric_columns)
    with col2:
        st.write('Categorical columns:\t', categorical_columns)

    # Calculate statistics for the dataset.
    st.dataframe(snowpark_df.describe().sort('SUMMARY'), use_container_width=True)