Bruno Canal
06/06/2021, 12:47 AM
msg="path not found" func="pkg/gateway/operations.(*HeadObject).Handle" file="build/pkg/gateway/operations/headobject.go:30" host="s3.local.lakefs.io:8000" method=HEAD path=.spark-staging-2d639c01-addd-4495-91a1-37ef56187e69/ ref=develop repository=customers request_id=f7da0575-3295-4fc2-90d0-ba6bb1c96b83 service_name=s3_gateway user=admin
many times... Can someone help me?
Bruno Canal
06/06/2021, 12:48 AM
from pyspark.sql import SparkSession
def spark_session():
    """Create a local SparkSession whose s3a filesystem points at the lakeFS S3 gateway.

    The session runs with master 'local[1]' under the application name
    'lakefs'. After creation, the Hadoop configuration is given the s3a
    access key, secret key, endpoint and path-style-access settings.

    Returns:
        SparkSession: the configured (or already existing) session.
    """
    spark: SparkSession = (
        SparkSession.builder
        .master('local[1]')
        .appName('lakefs')
        # Extra jars handed to Spark through spark.jars (comma-separated list).
        .config('spark.jars', '../resources/jars/hadoop-aws-3.2.0.jar, ../resources/jars/aws-java-sdk-bundle-1.11.375.jar')
        .getOrCreate()
    )

    # Fetch the Hadoop configuration once instead of re-resolving it per setting.
    hadoop_conf = spark.sparkContext._jsc.hadoopConfiguration()

    # NOTE(review): credentials are hard-coded in source; rotate them and load
    # them from the environment or a secrets store before sharing this script.
    hadoop_conf.set('fs.s3a.access.key', 'AKIAJYCCHHXD5F3I3NDQ')
    hadoop_conf.set('fs.s3a.secret.key', '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')
    # Plain URL: the angle brackets that wrapped it were chat link markup and
    # are not part of a valid endpoint.
    hadoop_conf.set('fs.s3a.endpoint', 'http://s3.local.lakefs.io:8000')
    hadoop_conf.set("fs.s3a.path.style.access", "true")
    return spark
def main():
    """Write a three-row sample DataFrame as Parquet to a lakeFS branch via s3a.

    Builds the session with spark_session(), creates a DataFrame with the
    columns 'id' and 'value', and writes it in 'overwrite' mode to
    s3a://customers/develop. The session is stopped even if the write fails.
    """
    spark = spark_session()
    try:
        df = spark.createDataFrame([(3, 'bern'), (4, 'raf'), (6, 'brun')], ['id', 'value'])
        repo = "customers"
        branch = "develop"
        # NOTE(review): the target is the branch root (no object path after the
        # branch name); confirm this is intended rather than a sub-path such as
        # s3a://<repo>/<branch>/<table>.
        path = f's3a://{repo}/{branch}'
        print(f'writing to {path}')
        df.write.mode('overwrite').parquet(path)
        print('finished')
    finally:
        # Release the session even when the write raises.
        spark.stop()


main()
Tal Sofer
06/06/2021, 1:04 AMBruno Canal
06/06/2021, 1:21 AMTal Sofer
06/06/2021, 1:52 AMBruno Canal
06/06/2021, 10:44 AMTal Sofer
06/06/2021, 10:45 AMTal Sofer
06/06/2021, 10:45 AMBruno Canal
06/06/2021, 10:46 AMBruno Canal
06/06/2021, 10:49 AMBruno Canal
06/06/2021, 10:50 AMTal Sofer
06/06/2021, 10:51 AMBruno Canal
06/06/2021, 10:51 AMTal Sofer
06/06/2021, 10:56 AMBruno Canal
06/06/2021, 11:00 AMTal Sofer
06/06/2021, 11:01 AMTal Sofer
06/06/2021, 11:32 AMBruno Canal
06/06/2021, 11:33 AMTal Sofer
06/06/2021, 11:35 AMBruno Canal
06/06/2021, 11:42 AMBruno Canal
06/06/2021, 11:42 AM
listen_address: "0.0.0.0:8000"
logging:
  format: text
  level: DEBUG
  output: "-"
database:
  # <DATABASE IP> is presumably a redaction placeholder for the real Postgres host.
  connection_string: "postgres://lakefs:lakefs@<DATABASE IP>/postgres?sslmode=disable"
auth:
  encrypt:
    # NOTE(review): short, guessable secret; replace it outside of local testing.
    secret_key: "lakefs"
blockstore:
  type: gs
  gs:
    credentials_file: "/home/lakefs/.credentials.json"
gateways:
  s3:
    domain_name: "s3.local.lakefs.io:8000"
Bruno Canal
06/06/2021, 11:45 AM
docker run \
--name lakefs \
-p 8000:8000 \
--network bridge \
-v $(pwd)/lakefs-config.yaml:/home/lakefs/.lakefs.yaml \
-v $(pwd)/credentials.json:/home/lakefs/.credentials.json \
treeverse/lakefs:0.41.1 run
Tal Sofer
06/06/2021, 11:57 AMTal Sofer
06/06/2021, 12:00 PMBruno Canal
06/06/2021, 12:04 PMTal Sofer
06/06/2021, 12:18 PM