Skip to content

Commit c063e5f

Browse files
authored
Replacing the dataset for h2o sample_script to fix tests (#1258)
1 parent 6f517b2 commit c063e5f

File tree

1 file changed

+3
-8
lines changed

1 file changed

+3
-8
lines changed

h2o/sample-script.py

Lines changed: 3 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -5,10 +5,9 @@
5 5
spark = SparkSession.builder.appName("SparklingWaterApp").getOrCreate()
6 6
hc = H2OContext.getOrCreate()
7 7

8-
bucket = "h2o-bq-large-dataset"
9-
train_path = "demos/cc_train.csv"
10-
test_path = "demos/cc_test.csv"
11-
y = "DEFAULT_PAYMENT_NEXT_MONTH"
8+
bucket = "h2o-bq-large-dataset-1"
9+
train_path = "demos/prostate.csv"
10+
y = "CAPSULE"
12 11
is_classification = True
13 12

14 13
drop_cols = []
@@ -17,13 +16,9 @@
17 16
train_data = spark.read\
18 17
.options(header='true', inferSchema='true')\
19 18
.csv("gs://{}/{}".format(bucket, train_path))
20-
test_data = spark.read\
21-
.options(header='true', inferSchema='true')\
22-
.csv("gs://{}/{}".format(bucket, test_path))
23 19

24 20
print("CREATING H2O FRAME")
25 21
training_frame = hc.asH2OFrame(train_data)
26-
test_frame = hc.asH2OFrame(test_data)
27 22

28 23
x = training_frame.columns
29 24
x.remove(y)

0 commit comments

Comments
 (0)