fix bugs due to tf2 release (#447)

TheMichaelHu · web-flow · commit 63184378840d · 2020-04-17T09:59:18.000-07:00
diff --git a/examples/cloudml-collaborative-filtering/README.md b/examples/cloudml-collaborative-filtering/README.md
@@ -26,12 +26,19 @@ Create a new project on GCP and set up GCP credentials:
 gcloud auth login
 gcloud auth application-default login
 ```
+
+Enable the following APIS:
+- [Dataflow](http://console.cloud.google.com/apis/api/dataflow.googleapis.com)
+- [AI Platform](http://console.cloud.google.com/apis/api/ml.googleapis.com)
+
 Using the `preprocessing/config.example.ini` template, create
 `preprocessing/config.ini` with the GCP project id fields filled in.
+Additionally, you will need to create a GCS bucket. This code assumes a bucket
+exists by the name of `[project-id]-bucket`.
 
 Set up your python environment:
 ```shell
-virtualenv venv -p python3
+python3 -m venv venv
 source ./venv/bin/activate
 pip install -r requirements.txt
 ```
@@ -113,7 +120,8 @@ Model training can be monitored on Tensorboard using the following command:
 tensorboard --logdir <path to model dir>/<trial number>
 ```
 Tensorboard's projector, in particular, is very useful for debugging
-or analyzing embeddings.
+or analyzing embeddings. In the projector tab in Tensorboard, try setting the
+label to `name`.
 
 ## Serving
 Models can be hosted on CAIP, which can be used to make online and batch predictions via JSON requests.
diff --git a/examples/cloudml-collaborative-filtering/bin/run.predict.cloud.sh b/examples/cloudml-collaborative-filtering/bin/run.predict.cloud.sh
@@ -22,6 +22,11 @@
 #   TRIAL (optional): The trial number to use.
 . ./bin/_common.sh
 
+if [ "$#" -lt 1 ]; then
+  echo "Illegal number of parameters. Should be >= 1, given $#."
+  exit 1
+fi
+
 MODEL_OUTPUTS_DIR=$1
 TRIAL=${2:-${DEFAULT_TRIAL}}
 
diff --git a/examples/cloudml-collaborative-filtering/bin/run.serve.cloud.sh b/examples/cloudml-collaborative-filtering/bin/run.serve.cloud.sh
@@ -22,6 +22,11 @@
 #   TRIAL (optional): The trial number to use.
 . ./bin/_common.sh
 
+if [ "$#" -lt 1 ]; then
+  echo "Illegal number of parameters. Should be >= 1, given $#."
+  exit 1
+fi
+
 MODEL_OUTPUTS_DIR=$1
 TRIAL=${2:-${DEFAULT_TRIAL}}
 
diff --git a/examples/cloudml-collaborative-filtering/bin/run.train.cloud.sh b/examples/cloudml-collaborative-filtering/bin/run.train.cloud.sh
@@ -21,6 +21,11 @@
 #                     This should just be a timestamp.
 . ./bin/_common.sh
 
+if [ "$#" -lt 1 ]; then
+  echo "Illegal number of parameters. Should be >= 1, given $#."
+  exit 1
+fi
+
 MODEL_INPUTS_DIR=$1
 
 NOW="$(get_date_time)"
@@ -37,13 +42,13 @@ gcloud ai-platform jobs submit training "${TRAINING_JOB_NAME}" \
   --staging-bucket "${OUTPUT_BUCKET}" \
   --package-path trainer \
   --region us-east1 \
-  --runtime-version 1.13 \
+  --runtime-version 1.15 \
   --scale-tier "${SCALE_TIER}" \
   -- \
   --model_dir "${MODEL_PATH}" \
   --input_dir "${INPUT_PATH}" \
   --tft_dir "${TFT_PATH}" \
-  --max_steps 300000 \
+  --max_steps 100000 \
   --batch_size 512 \
   --user_embed_mult 1.5 \
   --item_embed_mult 1 \
diff --git a/examples/cloudml-collaborative-filtering/bin/run.train.local.sh b/examples/cloudml-collaborative-filtering/bin/run.train.local.sh
@@ -21,6 +21,11 @@
 #                     This should just be a timestamp.
 . ./bin/_common.sh
 
+if [ "$#" -lt 1 ]; then
+  echo "Illegal number of parameters. Should be >= 1, given $#."
+  exit 1
+fi
+
 MODEL_INPUTS_DIR=$1
 
 PROJECT_ID="$(get_project_id)"
diff --git a/examples/cloudml-collaborative-filtering/preprocessing/config.example.ini b/examples/cloudml-collaborative-filtering/preprocessing/config.example.ini
@@ -4,7 +4,7 @@ runner = DataflowRunner
 max_num_workers = 5
 defaultWorkerLogLevel = INFO
 log_level = ERROR
-zone = us-east1-b
+region = us-east1
 
 [LOCAL]
 project = [GCP_PROJECT_ID]
diff --git a/examples/cloudml-collaborative-filtering/preprocessing/run_preprocess.py b/examples/cloudml-collaborative-filtering/preprocessing/run_preprocess.py
@@ -107,7 +107,7 @@ def get_pipeline_options(args, config):
             "../setup.py")),
         "staging_location": os.path.join(args.job_dir, "staging"),
         "temp_location": os.path.join(args.job_dir, "tmp"),
-        "zone": config.get("zone")
+        "region": config.get("region"),
     })
   pipeline_options = beam.pipeline.PipelineOptions(flags=[], **options)
   return pipeline_options
diff --git a/examples/cloudml-collaborative-filtering/requirements.txt b/examples/cloudml-collaborative-filtering/requirements.txt
@@ -1,9 +1,9 @@
- apache-beam[gcp]>=2.13.0
- configparser>=3.7.4
- google-api-core>=1.13.0
- google-api-python-client>=1.7.9
- google-cloud-core>=1.0.2
- nose>=1.3.7
- tensorflow>=1.14.0
- tensorflow-transform>=0.13.0
-
+apache-beam[gcp]>=2.16.0
+configparser>=3.7.4
+google-api-core>=1.13.0
+google-api-python-client>=1.7.9
+google-cloud-core>=1.0.2
+nose>=1.3.7
+tensorboard==1.15.0
+tensorflow>=0.15.0,<2.0.0
+tensorflow-transform==0.21.2
diff --git a/examples/cloudml-collaborative-filtering/trainer/model.py b/examples/cloudml-collaborative-filtering/trainer/model.py
@@ -20,8 +20,8 @@
 import json
 import os
 
+from tensorboard.plugins import projector
 import tensorflow as tf
-from tensorflow.contrib.tensorboard.plugins import projector
 import tensorflow_transform as tft
 
 # pylint: disable=g-bad-import-order
diff --git a/examples/cloudml-collaborative-filtering/trainer/utils.py b/examples/cloudml-collaborative-filtering/trainer/utils.py
@@ -71,8 +71,8 @@ def write_projector_metadata(metadata_dir, tft_dir):
                                               constants.NUM_PROJECTOR_ITEMS)
   metadata = user_metadata + item_metadata
   metadata_path = os.path.join(metadata_dir, constants.PROJECTOR_PATH)
-  tf.gfile.MakeDirs(metadata_dir)
-  with tf.gfile.GFile(metadata_path, "w+") as f:
+  tf.io.gfile.makedirs(metadata_dir)
+  with tf.io.gfile.GFile(metadata_path, "w+") as f:
     f.write("label\tname\n")
-    f.write("\n".join(["\t".join(sample) for sample in metadata]))
+    f.write("\n".join(["{}\t{}".format(label, name) for label, name in metadata]))
   return user_indices, item_indices