Walker数据集
数据帧
Pandas
import gwalkr as gwk
import pandas as pd
df = pd.read_csv("data.csv")
walker = gwk.walk(df)
Polars
import gwalkr as gwk
import polars as pl
df = pl.read_csv("data.csv")
walker = gwk.walk(df)
Modin
import gwalkr as gwk
import modin.pandas as mpd
df = mpd.read_csv("data.csv")
walker = gwk.walk(df)
数据库
连接器代码
from gwalkr.data_parsers.database_parser import Connector
conn = Connector(
"snowflake://username:password@host/database/schema",
"""
SELECT
*
FROM
XXX
"""
)
连接器参数
参数 | 类型 | 默认值 | 描述 |
---|---|---|---|
url | str | - | 数据库连接 URL，格式请参考 SQLAlchemy 文档。示例：mysql+pymysql://user:password@host:port/database |
view_sql | str | - | 用于定义数据视图的 SQL 查询语句。示例：SELECT * FROM table_name |
engine_params | Optional[Dict[str, Any]] | None | SQLAlchemy 引擎参数，可用选项请参考 SQLAlchemy 文档。示例：{"pool_size": 10} |
Snowflake
from gwalkr.data_parsers.database_parser import Connector
import gwalkr as gwk
conn = Connector(
"snowflake://username:password@host/database/schema",
"""
SELECT
*
FROM
XXX
"""
)
walker = gwk.walk(conn)
Postgres
from gwalkr.data_parsers.database_parser import Connector
import gwalkr as gwk
conn = Connector(
"postgresql+psycopg2://username:password@host:port/database",
"""
SELECT
*
FROM
XXX
"""
)
walker = gwk.walk(conn)
其他数据库
理论上，Connector 支持 SQLAlchemy 所支持的所有数据库。
使用前请参考 SQLAlchemy 文档，并安装目标数据库对应的驱动程序。