```bash
pip install dpark
```
```yaml
master_host: <master_ip_address>
master_port: <master_port_number>
```
python
from dpark import DparkContext
def sum_numbers(numbers):
    """Return the sum of an iterable of numbers.

    Args:
        numbers: An iterable of numeric values (for example a list of ints).

    Returns:
        The total computed by the built-in ``sum``; 0 for an empty iterable.
    """
    return sum(numbers)


if __name__ == "__main__":
    dpark_context = DparkContext()
    data = list(range(1, 1001))

    # sum_numbers expects an iterable, so every RDD element must itself be a
    # collection of numbers. Mapping it over bare ints would raise
    # "TypeError: 'int' object is not iterable", so split the input into
    # fixed-size chunks first and let map() sum one chunk at a time.
    chunk_size = 100
    chunks = [data[i:i + chunk_size] for i in range(0, len(data), chunk_size)]

    # Sum each chunk via map(), then combine the partial sums with reduce().
    result = (
        dpark_context.parallelize(chunks)
        .map(sum_numbers)
        .reduce(lambda x, y: x + y)
    )
    print("Sum:", result)
```bash
python distributed_computing.py
```