VerticaPy

Python API for Vertica Data Science at Scale

Joins

When working with datasets, we often need to merge data from different sources. To do this, we need keys on which to join our data.

Let's use the US Flights 2015 datasets. We have three datasets.

First, we have information on each flight.

In [57]:
import verticapy as vp
flights  = vp.read_csv("data/flights.csv")
display(flights)
123
YEAR
Int
123
MONTH
Int
123
DAY
Int
123
DAY_OF_WEEK
Int
Abc
AIRLINE
Varchar(20)
123
FLIGHT_NUMBER
Int
Abc
TAIL_NUMBER
Varchar(20)
Abc
ORIGIN_AIRPORT
Varchar(20)
Abc
DESTINATION_AIRPORT
Varchar(20)
123
SCHEDULED_DEPARTURE
Int
123
DEPARTURE_TIME
Int
123
DEPARTURE_DELAY
Int
123
TAXI_OUT
Int
123
WHEELS_OFF
Int
123
SCHEDULED_TIME
Int
123
ELAPSED_TIME
Int
123
AIR_TIME
Int
123
DISTANCE
Int
123
WHEELS_ON
Int
123
TAXI_IN
Int
123
SCHEDULED_ARRIVAL
Int
123
ARRIVAL_TIME
Int
123
ARRIVAL_DELAY
Int
123
DIVERTED
Int
123
CANCELLED
Int
Abc
CANCELLATION_REASON
Varchar(20)
123
AIR_SYSTEM_DELAY
Int
123
SECURITY_DELAY
Int
123
AIRLINE_DELAY
Int
123
LATE_AIRCRAFT_DELAY
Int
123
WEATHER_DELAY
Int
12015114AA1N787AAJFKLAX900855-51791239040237824751230712301237700[null][null][null][null][null][null]
22015114AA2N795AALAXJFK900856-41691233529527124751643817351651-4400[null][null][null][null][null][null]
32015114AA3N798AAJFKLAX12301226-419124538038235824751543515501548-200[null][null][null][null][null][null]
42015114AA4N799AALAXJFK12201214-6231237330319284247520211220502033-1700[null][null][null][null][null][null]
52015114AA5N376AADFWHNL130517542892118155155264993784223461740224030000[null]110197920
62015114AA6N398AAOGGDFW1805[null][null][null][null]425[null][null]3711[null][null]510[null][null]01A[null][null][null][null][null]
72015114AA7N398AADFWOGG121515131782415375005174903711194731635195019500[null]17017800
82015114AA8N368AAHNLDFW1745193310815194844544642037846481151065910900[null]1001080
92015114AA9N792AAJFKLAX700649-112271138039736824751019710201026600[null][null][null][null][null][null]
102015114AA10N796AALAXJFK21502150014220430929427524755395559544-1500[null][null][null][null][null][null]
112015114AA12N792AALAXJFK11151114-1191133335321287247519201519501935-1500[null][null][null][null][null][null]
122015114AA14N5ERAAOGGLAX23002254-6122306305289267248653310605543-2200[null][null][null][null][null][null]
132015114AA15N783AAJFKSFO800755-557852400453388258612208114012284800[null]480000
142015114AA16N783AASFOJFK12451316311813343303333052586213910211521493400[null]300310
152015114AA17N019AAATLMIA700656-415711112106825948339852842-1000[null][null][null][null][null][null]
162015114AA19N786AAJFKLAX11001055-517111238037835424751406714201413-700[null][null][null][null][null][null]
172015114AA20N789AASFOJFK15001503319152232532830125862323823252331600[null][null][null][null][null][null]
182015114AA21N795AAJFKLAX1845185162919203854073682475222810221022382800[null]220600
192015114AA22N786AALAXJFK15151512-3231535320317277247523121723352329-600[null][null][null][null][null][null]
202015114AA23N371AADFWSFO755841463591623023319014641026894510344900[null]304600
212015114AA23N371AASFODFW10501123332811512102171781464164911162017004000[null]700330
222015114AA24N784AASFOJFK720714-62073434033230725861541516001546-1400[null][null][null][null][null][null]
232015114AA25N3AVAABOSLAX900857-31591239540538126111233912351242700[null][null][null][null][null][null]
242015114AA27N5DUAADFWLAS1850192939161945175165141105520068194520142900[null]002900
252015114AA28N358AALAXMIA15001456-4191515290305284234222592225023011100[null][null][null][null][null][null]
262015114AA29N455AAONTDFW122513569125142117521714911881850431720193313300[null]4209100
272015114AA29N568AADFWONT1035[null][null][null][null]190[null][null]1188[null][null]1145[null][null]01B[null][null][null][null][null]
282015114AA30N795AALAXJFK23302326-423234932029927024757196750725-2500[null][null][null][null][null][null]
292015114AA31N5ESAALAXHNL8058282312840365362346255612264121012302000[null]002000
302015114AA32N794AALAXJFK141514249141438325315288247522261322402239-100[null][null][null][null][null][null]
312015114AA35N3ALAADFWHDN11101109-1111120145178111769121156123513073200[null]320000
322015114AA35N3ALAAHDNDFW1320140040111411135130109769170010163517103500[null]007280
332015114AA36N3EKAASANDFW935928-713941170172140117114011914251420-500[null][null][null][null][null][null]
342015114AA37N483AADFWSAN21002103318212118518716611712207322052210500[null][null][null][null][null][null]
352015114AA40N3BYAADCAORD9559550910041301261116121055611051101-400[null][null][null][null][null][null]
362015114AA41N3KEAAORDSEA20552054-11621102702932361721230641232523472200[null]220000
372015114AA42N3GPAASEAORD850849-11690523522420117211426714451433-1200[null][null][null][null][null][null]
382015114AA43N3BNAADFWDTW1030[null][null][null][null]150[null][null]986[null][null]1400[null][null]01B[null][null][null][null][null]
392015114AA43N3KCAADTWDFW144514450191504180199163986164717164517041900[null]190000
402015114AA44N3AJAALASJFK810803-71782029527224822481528716051535-3000[null][null][null][null][null][null]
412015114AA45N3ELAAJFKLAS17291727-221174835534731822482006820242014-1000[null][null][null][null][null][null]
422015114AA46N3CSAASJCORD725725013738255253226182913241413401338-200[null][null][null][null][null][null]
432015114AA47N3KSAAORDSJC1915203580182053280261238182922515215522566100[null]000610
442015114AA48N3JXAASANDFW835830-513843175164141117113041013301314-1600[null][null][null][null][null][null]
452015114AA49N5ELAADFWSAN1935200631152021185178160117121013204021042400[null]002400
462015114AA50N570AASLCDFW81582493690016517913498912149120012232300[null]140900
472015114AA51N471AADFWSLC17252035190242059170161130989220971915221618100[null]00221590
482015114AA52N3LMAALAXDCA12251222-318124029027925323111953820152001-1400[null][null][null][null][null][null]
492015114AA53N3LHAADCALAX840838-21285036035033123111121711401128-1200[null][null][null][null][null][null]
502015114AA54N3CWAALASORD910906-41692221519317015141412714451419-2600[null][null][null][null][null][null]
512015114AA55N3JJAAORDLAS1820192464131937230225205151421027201021095900[null]005900
522015114AA58N5DFAAKOALAX1400140002214223103202762504205822211021201000[null][null][null][null][null][null]
532015114AA59N5DFAALAXKOA840837-31785435035233225041226312301229-100[null][null][null][null][null][null]
542015114AA60N372AADFWMIA175419551211520101601511331121232332134232611200[null]0011200
552015114AA61N850AAMIADFW715719413732199192167112191912934931-300[null][null][null][null][null][null]
562015114AA63N3ECAAMIAPHX19501955523201831730227119722249823072257-1000[null][null][null][null][null][null]
572015114AA64N3HXAADFWJFK102510411613105420018716913911443514451448300[null][null][null][null][null][null]
582015114AA65N3HLAAJFKDFW16151625101916442552942271391193148193020194900[null]3901000
592015114AA66N631AASJUJFK11511142-922120424524722115981445414561449-700[null][null][null][null][null][null]
602015114AA67N631AAJFKSJU160516292423165223521118215982054621002100000[null][null][null][null][null][null]
612015114AA68N5EGAASFOMIA70070331471732431729525851512815241520-400[null][null][null][null][null][null]
622015114AA69N3HTAAMIASFO18351836112184838635934225852130522012135-2600[null][null][null][null][null][null]
632015114AA70N5BTAASANDFW705659-622721180171137117111381212051150-1500[null][null][null][null][null][null]
642015114AA71N3GHAADFWSAN18051803-214181718017616011711857219051859-600[null][null][null][null][null][null]
652015114AA72N5EKAADFWMCO6006066186241451421209859244925928300[null][null][null][null][null][null]
662015114AA72N5EKAAMCODFW10201015-516103117517114398511541212151206-900[null][null][null][null][null][null]
672015114AA73N3FBAAPHLCLT1005957-8261023120108764491139612051145-2000[null][null][null][null][null][null]
682015114AA74N488AACLEDFW15551552-311160319018116110211744918051753-1200[null][null][null][null][null][null]
692015114AA74N505AADFWCLE1145[null][null][null][null]150[null][null]1021[null][null]1515[null][null]01B[null][null][null][null][null]
702015114AA75N3HPAAIADLAX18301822-817183936035833522882114621302120-1000[null][null][null][null][null][null]
712015114AA76N3HPAALAXIAD950946-418100428526524322881707417351711-2400[null][null][null][null][null][null]
722015114AA76N3HPAASFOLAX730723-71573885974933782733855900500[null][null][null][null][null][null]
732015114AA79N520AADFWSMF2140221939302249225224188143123576232533800[null]000380
742015114AA80N4XTAATUSDFW1655174146101751130130105813203615200520514600[null]000460
752015114AA81N4XCAADFWTUS22452308231323211401401238132445282300[null]000230
762015114AA83N4XBAAMCODFW735733-21674918017414698591512935927-800[null][null][null][null][null][null]
772015114AA84N3AXAABOSJFK940930-10159457569461871031810551039-1600[null][null][null][null][null][null]
782015114AA84N3AXAAJFKBOS7307344177517065441878354840839-100[null][null][null][null][null][null]
792015114AA85N785AAJFKSFO15301524-620154440038636125861845519101850-2000[null][null][null][null][null][null]
802015114AA86N3GTAAPDXORD705701-41571623523020817391244713001251-900[null][null][null][null][null][null]
812015114AA87N490AAORDRNO18451840-511185126522821316712024421102028-4200[null][null][null][null][null][null]
822015114AA89N3KVAAIAHMIA520618581963714113711196492878419355400[null]005400
832015114AA92N3KHAASANORD90090001591524021018917231424615001430-3000[null][null][null][null][null][null]
842015114AA93N3HHAAORDSAN1720180545101815255222210172319452193519471200[null][null][null][null][null][null]
852015114AA94N3ANAASANJFK755810151382332028126224461545616151551-2400[null][null][null][null][null][null]
862015114AA95N3ANAAJFKSAN1720174929181807380386363244621105204021153500[null]602900
872015114AA96N553AADFWSTL82083111218529594705501002395510051000[null][null][null][null][null][null]
882015114AA96N553AASTLDFW103510511615110611513198550124418123013023200[null]1606100
892015114AA97N3ENAADCADFW845842-314856215210185119211011111201112-800[null][null][null][null][null][null]
902015114AA99N3KMAAORDPDX15501553311160427525323917391803318251806-1900[null][null][null][null][null][null]
912015114AA102N376AAHNLDFW1920235627617134454454173784111011645112127600[null]0002760
922015114AA103N4XSAADFWMSY141014332313144680806244715485153015532300[null]002300
932015114AA103N4XSAAMSYDFW16101624148163210091744471746917501755500[null][null][null][null][null][null]
942015114AA110N3LRAASNAORD805801-47808230211194172613221013551332-2300[null][null][null][null][null][null]
952015114AA111N3LYAAORDSNA17201719-111173026023722217261912419401916-2400[null][null][null][null][null][null]
962015114AA112N857AADENMIA101510172191036224229199170915551115591606700[null][null][null][null][null][null]
972015114AA113N3GRAAMIADEN211521150212136269269235170923311323442344000[null][null][null][null][null][null]
982015114AA115N3CTAALAXMIA105103-21411728627625523428327851839-1200[null][null][null][null][null][null]
992015114AA116N383AAOGGDFW1955201621102026430433418371172457057292400[null]302100
1002015114AA117N793AAJFKLAX14451438-728150639038935524751801618151807-800[null][null][null][null][null][null]
Rows: 1-100 | Columns: 31

Second, we have information on each airport.

In [58]:
airports = vp.read_csv("data/airports.csv")
display(airports)
Abc
IATA_CODE
Varchar(20)
Abc
Varchar(156)
Abc
CITY
Varchar(60)
Abc
STATE
Varchar(20)
Abc
COUNTRY
Varchar(20)
🌎
LATITUDE
Numeric(10,6)
🌎
LONGITUDE
Numeric(11,6)
1ABEAllentownPAUSA40.65236-75.4404
2ABIAbileneTXUSA32.41132-99.6819
3ABQAlbuquerqueNMUSA35.04022-106.60919
4ABRAberdeenSDUSA45.44906-98.42183
5ABYAlbanyGAUSA31.53552-84.19447
6ACKNantucketMAUSA41.25305-70.06018
7ACTWacoTXUSA31.61129-97.23052
8ACVArcata/EurekaCAUSA40.97812-124.10862
9ACYAtlantic CityNJUSA39.45758-74.57717
10ADKAdakAKUSA51.87796-176.64603
11ADQKodiakAKUSA57.74997-152.49386
12AEXAlexandriaLAUSA31.32737-92.54856
13AGSAugustaGAUSA33.36996-81.9645
14AKNKing SalmonAKUSA58.6768-156.64922
15ALBAlbanyNYUSA42.74812-73.80298
16ALOWaterlooIAUSA42.55708-92.40034
17AMAAmarilloTXUSA35.21937-101.70593
18ANCAnchorageAKUSA61.17432-149.99619
19APNAlpenaMIUSA45.07807-83.56029
20ASEAspenCOUSA39.22316-106.86885
21ATLAtlantaGAUSA33.64044-84.42694
22ATWAppletonWIUSA44.25741-88.51948
23AUSAustinTXUSA30.19453-97.66987
24AVLAshevilleNCUSA35.43619-82.54181
25AVPWilkes-Barre/ScrantonPAUSA41.33815-75.72427
26AZOKalamazooMIUSA42.23488-85.55206
27BDLWindsor LocksCTUSA41.93887-72.68323
28BETBethelAKUSA60.77978-161.838
29BFLBakersfieldCAUSA35.4336-119.05677
30BGMBinghamtonNYUSA42.20848-75.97961
31BGRBangorMEUSA44.80744-68.82814
32BHMBirminghamALUSA33.56294-86.75355
33BILBillingsMTUSA45.80766-108.54286
34BISBismarckNDUSA46.77411-100.74672
35BJIBemidjiMNUSA47.50942-94.93372
36BLIBellinghamWAUSA48.79275-122.53753
37BMIBloomingtonILUSA40.47799-88.91595
38BNANashvilleTNUSA36.12448-86.67818
39BOIBoiseIDUSA43.56444-116.22278
40BOSBostonMAUSA42.36435-71.00518
41BPTBeaumont/Port ArthurTXUSA29.95083-94.02069
42BQKBrunswickGAUSA31.25903-81.46631
43BQNAguadillaPRUSA18.49486-67.12944
44BRDBrainerdMNUSA46.39786-94.13723
45BROBrownsvilleTXUSA25.90683-97.42586
46BRWBarrowAKUSA71.28545-156.766
47BTMButteMTUSA45.9548-112.49746
48BTRBaton RougeLAUSA30.53316-91.14963
49BTVBurlingtonVTUSA44.473-73.15031
50BUFBuffaloNYUSA42.94052-78.73217
51BURBurbankCAUSA34.20062-118.3585
52BWIBaltimoreMDUSA39.1754-76.6682
53BZNBozemanMTUSA45.7769-111.15301
54CAEColumbiaSCUSA33.93884-81.11954
55CAKAkronOHUSA40.91631-81.44247
56CDCCedar CityUTUSA37.70097-113.09858
57CDVCordovaAKUSA60.49183-145.47765
58CECCrescent CityCAUSA41.78016-124.23653
59CHAChattanoogaTNUSA35.03527-85.20379
60CHOCharlottesvilleVAUSA38.13864-78.45286
61CHSCharlestonSCUSA32.89865-80.04051
62CIDCedar RapidsIAUSA41.88459-91.71087
63CIUSault Ste. MarieMIUSA46.25075-84.47239