You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

get_data.py 442 B

12345678910111213141516
  1. import os
  2. import pandas as pd
  3. def get_data(data_root="./data"):
  4. dtrain = pd.read_csv(os.path.join(data_root, "train.csv"))
  5. dtest = pd.read_csv(os.path.join(data_root, "test.csv"))
  6. # returned X(DataFrame), y(Series)
  7. return (
  8. dtrain[["discourse_text", "discourse_type"]],
  9. dtrain["discourse_effectiveness"],
  10. dtest[["discourse_text", "discourse_type"]],
  11. dtest["discourse_effectiveness"],
  12. )