PySpark broadcast join is a technique used in PySpark (the Python API for Apache Spark) to improve join performance when one of the joined tables is small. The primary goal of a broadcast join is to eliminate the data shuffling and network overhead associated with join operations, which can yield considerable speed benefits. A broadcast join sends the smaller table (or DataFrame) to all worker nodes, ensuring each worker node has a complete copy of the smaller table in memory. This allows the join to be performed locally on each worker node, eliminating the need to shuffle and transfer data across the network.
We can use the broadcast() method from the pyspark.sql.functions module to perform broadcast joins in PySpark.
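Before we build a complete example, here is the basic pattern. The sketch below is only illustrative: large_df, small_df, and the join column "key" are hypothetical placeholders rather than objects defined in this lesson:

```python
from pyspark.sql.functions import broadcast

# Hypothetical DataFrames: large_df is big; small_df is small enough to fit
# comfortably in each executor's memory
joined = large_df.join(broadcast(small_df), on="key")
```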
Let us design two sample tables in PySpark to demonstrate the broadcast join. We'll use a larger sales table and a smaller products table:
order_id | product_id | quantity |
---------|------------|----------|
1        | 101        | 2        |
2        | 102        | 1        |
3        | 103        | 3        |
4        | 101        | 1        |
5        | 104        | 4        |
product_id | product_name | price |
-----------|--------------|-------|
101        | Learn C++    | 910   |
102        | Mobile: X1   | 14000 |
103        | LCD          | 8000  |
104        | Laptop       | 25000 |
Now, let's try a broadcast join in PySpark with the tables above:
```python
from pyspark.sql import SparkSession
from pyspark.sql.functions import broadcast

# Initialize the Spark session
spark = SparkSession.builder.appName("Broadcast Join Example").getOrCreate()

# Create DataFrames from sample data
sales_data = [(1, 101, 2), (2, 102, 1), (3, 103, 3), (4, 101, 1), (5, 104, 4)]
products_data = [(101, "Learn C++", 910), (102, "Mobile: X1", 14000), (103, "LCD", 8000), (104, "Laptop", 25000)]

sales_columns = ["order_id", "product_id", "quantity"]
products_columns = ["product_id", "product_name", "price"]

sales_df = spark.createDataFrame(sales_data, schema=sales_columns)
products_df = spark.createDataFrame(products_data, schema=products_columns)

# Perform broadcast join
result = sales_df.join(broadcast(products_df), sales_df["product_id"] == products_df["product_id"])

# Show result
result.show()
```
This PySpark code performs a broadcast join between two DataFrames, sales_df and products_df, using the "product_id" column as the key. Here's the explanation of each part:
Lines 1–2: Import the necessary modules from PySpark: SparkSession and the broadcast function.
Line 5: Initialize a SparkSession with the name "Broadcast Join Example".
Lines 8–9: Create sample sales and products data as lists of tuples.
Lines 11–12: Define column names for the sales and products DataFrames.
Lines 14–15: Create the sales and products DataFrames using the sample data and column names.
Line 18: Perform a broadcast join between the sales and products DataFrames using the "product_id" column as the key. The broadcast() function hints to Spark that the smaller DataFrame (products_df) should be broadcast to all worker nodes, optimizing the join performance; see the verification sketch after this list.
Line 21: Show the result of the join by calling the show() method on the resulting DataFrame.
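If we want to confirm that Spark actually planned a broadcast join rather than a shuffle-based one, we can print the physical plan of the result DataFrame defined above. The exact plan text varies by Spark version, but a broadcast hash join typically appears as a BroadcastHashJoin node:

```python
# Print the physical plan; a broadcast join shows up as a
# "BroadcastHashJoin" node instead of, e.g., a "SortMergeJoin"
result.explain()
```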
The result of the broadcast join above will be as follows:
order_id | product_id | quantity | product_id | product_name | price |
---------|------------|----------|------------|--------------|-------|
1        | 101        | 2        | 101        | Learn C++    | 910   |
2        | 102        | 1        | 102        | Mobile: X1   | 14000 |
3        | 103        | 3        | 103        | LCD          | 8000  |
4        | 101        | 1        | 101        | Learn C++    | 910   |
5        | 104        | 4        | 104        | Laptop       | 25000 |
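As a side note, Spark can also broadcast small tables automatically, without an explicit broadcast() hint, whenever their estimated size falls below the spark.sql.autoBroadcastJoinThreshold configuration (10 MB by default). Below is a short sketch of tuning that setting; the 50 MB value is chosen arbitrarily for illustration:

```python
# Raise the automatic broadcast threshold to 50 MB (the value is in bytes)
spark.conf.set("spark.sql.autoBroadcastJoinThreshold", 50 * 1024 * 1024)

# Alternatively, setting the threshold to -1 disables automatic broadcasting,
# so only DataFrames explicitly wrapped in broadcast() are broadcast:
# spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1)
```

The explicit broadcast() hint remains useful even with automatic broadcasting, because it works when Spark's size estimates for a table are missing or inaccurate.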