Skip to content

Commit

Permalink
cleanup examples
Browse files Browse the repository at this point in the history
  • Loading branch information
milenkovicm committed Dec 8, 2024
1 parent 87e6298 commit ab38e6a
Show file tree
Hide file tree
Showing 4 changed files with 39 additions and 9 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -16,16 +16,8 @@
# under the License.

# %%

from ballista import BallistaBuilder
from datafusion.context import SessionContext

# Ballista will initiate with an empty config
# set config variables with `config`
# ctx: SessionContext = BallistaBuilder()\
# .config("ballista.job.name", "example ballista")\
# .config("ballista.shuffle.partitions", "16")\
# .standalone()

ctx: SessionContext = BallistaBuilder().remote("df://127.0.0.1:50050")

Expand Down
File renamed without changes.
38 changes: 38 additions & 0 deletions python/examples/readme_remote.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

# %%

from ballista import BallistaBuilder
from datafusion.context import SessionContext

# Build a session against the remote endpoint. Each `config` call sets one
# key/value option on the builder before `remote` creates the context.
ctx: SessionContext = (
    BallistaBuilder()
    .config("ballista.job.name", "Readme Example Remote")
    .config("datafusion.execution.target_partitions", "4")
    .remote("df://127.0.0.1:50050")
)

# Register the test parquet file as external table `t` so it can be queried by name.
ctx.sql(
    "create external table t stored as parquet location '../testdata/test.parquet'"
)

# %%
# SQL route: query the registered table and show the first collected batch.
df = ctx.sql("select * from t limit 5")
batches = df.collect()
batches[0].to_pandas()
# %%
# DataFrame route: read the same parquet file directly, without the table.
df = ctx.read_parquet("../testdata/test.parquet").limit(5)
batches = df.collect()
batches[0].to_pandas()
# %%
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@
from datafusion.context import SessionContext

ctx: SessionContext = BallistaBuilder()\
.config("ballista.job.name", "Readme Examples")\
.config("ballista.job.name", "Readme Example")\
.config("datafusion.execution.target_partitions", "4")\
.standalone()

Expand Down

0 comments on commit ab38e6a

Please sign in to comment.