Hi,
If you want to read a file directly from GCS, there are two options:
1) Use the Google Cloud Storage client library to download the file:
import google.cloud.storage as storage

# Where the object lives: bucket name and object name inside that bucket.
bucket_name = 'facile-tmp-data'
file = 'mailchimp-mailchimp_campagne.json'

# Build a client, look the bucket up, then get a handle on the object.
storage_client = storage.Client()
bucket = storage_client.get_bucket(bucket_name)
blob = bucket.blob(file)

# Alternative: fetch the content into memory instead of writing a local file:
# content = blob.download_as_string()

# Save the object to a local file.
blob.download_to_filename('/tmp/campagin.json')
....
2) Use the built-in GCS file I/O in TensorFlow.
TensorFlow is already installed in Composer.
from tensorflow.python.lib.io import file_io
import pandas as pd
def fetch_as_dataframe(path) -> pd.DataFrame:
    """Load a JSON-lines or CSV file into a pandas DataFrame.

    The file is opened through TensorFlow's ``file_io.FileIO`` in text read
    mode, so ``path`` can be whatever that layer is able to open (for
    instance a ``gs://bucket/object`` URL).

    Args:
        path: Location of the file, as a string. A path ending in ``.json``
            or ``.jsonl`` (case-insensitive) is parsed as newline-delimited
            JSON (one record per line); any other path is parsed as CSV.

    Returns:
        The parsed file contents as a ``pandas.DataFrame``.
    """
    # Look at the suffix only: a plain substring test would also fire on
    # ".json" appearing in a bucket or directory name and misparse a CSV.
    is_json = path.lower().endswith((".json", ".jsonl"))
    with file_io.FileIO(path, 'r') as f:
        if is_json:
            return pd.read_json(f, lines=True)
        return pd.read_csv(f)
# Example: read the object straight from the bucket. The returned DataFrame is
# not assigned here, so capture it (e.g. `df = ...`) if you want to use it.
fetch_as_dataframe('gs://facile-tmp-data/mailchimp-mailchimp_campagne.json')