|
89 | 89 |
|
90 | 90 | # After this join we have all of the possible sales nations |
91 | 91 | df_regional_customers = df_regional_customers.join( |
92 | | - df_nation, (["r_regionkey"], ["n_regionkey"]), how="inner" |
| 92 | + df_nation, left_on=["r_regionkey"], right_on=["n_regionkey"], how="inner" |
93 | 93 | ) |
94 | 94 |
|
95 | 95 | # Now find the possible customers |
96 | 96 | df_regional_customers = df_regional_customers.join( |
97 | | - df_customer, (["n_nationkey"], ["c_nationkey"]), how="inner" |
| 97 | + df_customer, left_on=["n_nationkey"], right_on=["c_nationkey"], how="inner" |
98 | 98 | ) |
99 | 99 |
|
100 | 100 | # Next find orders for these customers |
101 | 101 | df_regional_customers = df_regional_customers.join( |
102 | | - df_orders, (["c_custkey"], ["o_custkey"]), how="inner" |
| 102 | + df_orders, left_on=["c_custkey"], right_on=["o_custkey"], how="inner" |
103 | 103 | ) |
104 | 104 |
|
105 | 105 | # Find all line items from these orders |
106 | 106 | df_regional_customers = df_regional_customers.join( |
107 | | - df_lineitem, (["o_orderkey"], ["l_orderkey"]), how="inner" |
| 107 | + df_lineitem, left_on=["o_orderkey"], right_on=["l_orderkey"], how="inner" |
108 | 108 | ) |
109 | 109 |
|
110 | 110 | # Limit to the part of interest |
111 | 111 | df_regional_customers = df_regional_customers.join( |
112 | | - df_part, (["l_partkey"], ["p_partkey"]), how="inner" |
| 112 | + df_part, left_on=["l_partkey"], right_on=["p_partkey"], how="inner" |
113 | 113 | ) |
114 | 114 |
|
115 | 115 | # Compute the volume for each line item |
|
126 | 126 |
|
127 | 127 | # Determine the suppliers by the limited nation key we have in our single row df above |
128 | 128 | df_national_suppliers = df_national_suppliers.join( |
129 | | - df_supplier, (["n_nationkey"], ["s_nationkey"]), how="inner" |
| 129 | + df_supplier, left_on=["n_nationkey"], right_on=["s_nationkey"], how="inner" |
130 | 130 | ) |
131 | 131 |
|
132 | 132 | # When we join to the customer dataframe, we don't want to confuse other columns, so only |
|
141 | 141 | # column only from suppliers in the nation we are evaluating. |
142 | 142 |
|
143 | 143 | df = df_regional_customers.join( |
144 | | - df_national_suppliers, (["l_suppkey"], ["s_suppkey"]), how="left" |
| 144 | + df_national_suppliers, left_on=["l_suppkey"], right_on=["s_suppkey"], how="left" |
145 | 145 | ) |
146 | 146 |
|
147 | 147 | # Use a case statement to compute the volume sold by suppliers in the nation of interest |
|
0 commit comments