diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml index b482fddb..c1cd28bc 100644 --- a/.github/workflows/ci.yaml +++ b/.github/workflows/ci.yaml @@ -82,4 +82,4 @@ jobs: run: pip install uv && uv pip install --system ".[dev]" - name: Run tests - run: nbdev_test --timing --do_print --n_workers 0 --skip_file_re "computing_at_scale|distributed" + run: nbdev_test --timing --do_print --n_workers 0 --skip_file_re "computing_at_scale|distributed" \ No newline at end of file diff --git a/nbs/assets/arima_rst.csv b/nbs/assets/arima_rst.csv new file mode 100644 index 00000000..564a3405 --- /dev/null +++ b/nbs/assets/arima_rst.csv @@ -0,0 +1,197 @@ +,unique_id,ds,AutoARIMA +0,FOODS_1,2016-04-25,2567.6380220997385 +1,FOODS_1,2016-04-26,2640.0126507600617 +2,FOODS_1,2016-04-27,2654.020161270193 +3,FOODS_1,2016-04-28,2796.440947432241 +4,FOODS_1,2016-04-29,3208.3811781219893 +5,FOODS_1,2016-04-30,3773.861663861278 +6,FOODS_1,2016-05-01,3299.79743620078 +7,FOODS_1,2016-05-02,2640.917833365884 +8,FOODS_1,2016-05-03,2694.336636469822 +9,FOODS_1,2016-05-04,2694.1035608286916 +10,FOODS_1,2016-05-05,2835.3163066249176 +11,FOODS_1,2016-05-06,3236.293019356992 +12,FOODS_1,2016-05-07,3797.241666185409 +13,FOODS_1,2016-05-08,3321.3663551719346 +14,FOODS_1,2016-05-09,2657.5206296593224 +15,FOODS_1,2016-05-10,2707.524732902354 +16,FOODS_1,2016-05-11,2704.747898679939 +17,FOODS_1,2016-05-12,2843.9075334840127 +18,FOODS_1,2016-05-13,3243.2271452721875 +19,FOODS_1,2016-05-14,3802.8383176295374 +20,FOODS_1,2016-05-15,3325.8835081296597 +21,FOODS_1,2016-05-16,2661.1665009534677 +22,FOODS_1,2016-05-17,2710.4673778864567 +23,FOODS_1,2016-05-18,2707.1229576998144 +24,FOODS_1,2016-05-19,2845.8244841791743 +25,FOODS_1,2016-05-20,3244.7743489150994 +26,FOODS_1,2016-05-21,3804.0870921121996 +27,FOODS_1,2016-05-22,3326.8914153406417 +28,FOODS_2,2016-04-25,5247.139313835306 +29,FOODS_2,2016-04-26,4792.960953564678 +30,FOODS_2,2016-04-27,4590.964924105041 
+31,FOODS_2,2016-04-28,4600.860960731239 +32,FOODS_2,2016-04-29,4942.967875785429 +33,FOODS_2,2016-04-30,6337.5344008647035 +34,FOODS_2,2016-05-01,6757.903656868389 +35,FOODS_2,2016-05-02,5607.448278542931 +36,FOODS_2,2016-05-03,5244.736379588703 +37,FOODS_2,2016-05-04,5004.324139775963 +38,FOODS_2,2016-05-05,4898.957821332703 +39,FOODS_2,2016-05-06,5310.50858073175 +40,FOODS_2,2016-05-07,6641.501751486881 +41,FOODS_2,2016-05-08,6994.60266694966 +42,FOODS_2,2016-05-09,5779.319357423172 +43,FOODS_2,2016-05-10,5407.162676474501 +44,FOODS_2,2016-05-11,5083.913842178118 +45,FOODS_2,2016-05-12,4944.398003219373 +46,FOODS_2,2016-05-13,5311.376375871703 +47,FOODS_2,2016-05-14,6593.071399563353 +48,FOODS_2,2016-05-15,6919.214380455565 +49,FOODS_2,2016-05-16,5687.59113569716 +50,FOODS_2,2016-05-17,5289.695188706264 +51,FOODS_2,2016-05-18,4961.060422560739 +52,FOODS_2,2016-05-19,4815.1162421391555 +53,FOODS_2,2016-05-20,5184.318070407874 +54,FOODS_2,2016-05-21,6467.664979048176 +55,FOODS_2,2016-05-22,6807.52592255971 +56,FOODS_3,2016-04-25,17666.731556718732 +57,FOODS_3,2016-04-26,16540.541376421595 +58,FOODS_3,2016-04-27,16160.633071055223 +59,FOODS_3,2016-04-28,16370.683658640599 +60,FOODS_3,2016-04-29,17889.869101221244 +61,FOODS_3,2016-04-30,22332.436097780206 +62,FOODS_3,2016-05-01,22713.044590532798 +63,FOODS_3,2016-05-02,17468.426315986457 +64,FOODS_3,2016-05-03,16293.254187261948 +65,FOODS_3,2016-05-04,15975.967829497 +66,FOODS_3,2016-05-05,16301.448695311468 +67,FOODS_3,2016-05-06,17742.192012594733 +68,FOODS_3,2016-05-07,22149.920466723906 +69,FOODS_3,2016-05-08,22672.51910973226 +70,FOODS_3,2016-05-09,17388.755964833897 +71,FOODS_3,2016-05-10,16229.554742510712 +72,FOODS_3,2016-05-11,15913.853788834986 +73,FOODS_3,2016-05-12,16229.441847880662 +74,FOODS_3,2016-05-13,17695.119173018684 +75,FOODS_3,2016-05-14,22118.38914081269 +76,FOODS_3,2016-05-15,22622.383902927766 +77,FOODS_3,2016-05-16,17352.915739873653 +78,FOODS_3,2016-05-17,16196.863301084244 
+79,FOODS_3,2016-05-18,15886.258449760904 +80,FOODS_3,2016-05-19,16208.436163712715 +81,FOODS_3,2016-05-20,17673.61997937043 +82,FOODS_3,2016-05-21,22097.648256558292 +83,FOODS_3,2016-05-22,22608.340998500338 +84,HOBBIES_1,2016-04-25,3301.1184614493914 +85,HOBBIES_1,2016-04-26,3190.0305707575 +86,HOBBIES_1,2016-04-27,3199.935172884026 +87,HOBBIES_1,2016-04-28,3225.695752897986 +88,HOBBIES_1,2016-04-29,3567.265955094044 +89,HOBBIES_1,2016-04-30,4356.224282294094 +90,HOBBIES_1,2016-05-01,4089.925888720474 +91,HOBBIES_1,2016-05-02,3256.234765934616 +92,HOBBIES_1,2016-05-03,3167.254279226249 +93,HOBBIES_1,2016-05-04,3182.164242104323 +94,HOBBIES_1,2016-05-05,3197.8208347975133 +95,HOBBIES_1,2016-05-06,3562.1759714192 +96,HOBBIES_1,2016-05-07,4348.942474784928 +97,HOBBIES_1,2016-05-08,4062.088166835995 +98,HOBBIES_1,2016-05-09,3270.411197190324 +99,HOBBIES_1,2016-05-10,3153.9826259751076 +100,HOBBIES_1,2016-05-11,3185.763508441231 +101,HOBBIES_1,2016-05-12,3215.5124943559786 +102,HOBBIES_1,2016-05-13,3557.0053751276196 +103,HOBBIES_1,2016-05-14,4347.883194155448 +104,HOBBIES_1,2016-05-15,4072.703812696276 +105,HOBBIES_1,2016-05-16,3257.5290353634405 +106,HOBBIES_1,2016-05-17,3160.8541642155105 +107,HOBBIES_1,2016-05-18,3181.513304571057 +108,HOBBIES_1,2016-05-19,3202.9504121022114 +109,HOBBIES_1,2016-05-20,3559.2179367013387 +110,HOBBIES_1,2016-05-21,4348.099858357742 +111,HOBBIES_1,2016-05-22,4064.243078853568 +112,HOBBIES_2,2016-04-25,372.73314373276685 +113,HOBBIES_2,2016-04-26,394.9539049862272 +114,HOBBIES_2,2016-04-27,383.16517087090995 +115,HOBBIES_2,2016-04-28,383.62499302365416 +116,HOBBIES_2,2016-04-29,398.311355639119 +117,HOBBIES_2,2016-04-30,394.347605737723 +118,HOBBIES_2,2016-05-01,410.1164983512131 +119,HOBBIES_2,2016-05-02,381.5187849900045 +120,HOBBIES_2,2016-05-03,390.5415783971641 +121,HOBBIES_2,2016-05-04,384.30591664608176 +122,HOBBIES_2,2016-05-05,382.0656727697983 +123,HOBBIES_2,2016-05-06,391.0787416473706 
+124,HOBBIES_2,2016-05-07,388.7836691251789 +125,HOBBIES_2,2016-05-08,393.876028907937 +126,HOBBIES_2,2016-05-09,390.2092112439395 +127,HOBBIES_2,2016-05-10,389.2354081364607 +128,HOBBIES_2,2016-05-11,388.6840382471152 +129,HOBBIES_2,2016-05-12,388.2380749588003 +130,HOBBIES_2,2016-05-13,387.8486951350242 +131,HOBBIES_2,2016-05-14,387.50441758710645 +132,HOBBIES_2,2016-05-15,387.19942014913687 +133,HOBBIES_2,2016-05-16,386.9291391176742 +134,HOBBIES_2,2016-05-17,386.6896116476871 +135,HOBBIES_2,2016-05-18,386.4773369473272 +136,HOBBIES_2,2016-05-19,386.28921406142393 +137,HOBBIES_2,2016-05-20,386.12249505879066 +138,HOBBIES_2,2016-05-21,385.9747446856811 +139,HOBBIES_2,2016-05-22,385.84380476581924 +140,HOUSEHOLD_1,2016-04-25,7401.891643264893 +141,HOUSEHOLD_1,2016-04-26,6713.059783961793 +142,HOUSEHOLD_1,2016-04-27,6568.574826414228 +143,HOUSEHOLD_1,2016-04-28,6780.766120981868 +144,HOUSEHOLD_1,2016-04-29,7572.471090810987 +145,HOUSEHOLD_1,2016-04-30,9760.255572651784 +146,HOUSEHOLD_1,2016-05-01,9626.516172187357 +147,HOUSEHOLD_1,2016-05-02,7339.549091656914 +148,HOUSEHOLD_1,2016-05-03,6715.501042329869 +149,HOUSEHOLD_1,2016-05-04,6588.688826450386 +150,HOUSEHOLD_1,2016-05-05,6792.018975120889 +151,HOUSEHOLD_1,2016-05-06,7585.826196179538 +152,HOUSEHOLD_1,2016-05-07,9784.576440586516 +153,HOUSEHOLD_1,2016-05-08,9625.229656671552 +154,HOUSEHOLD_1,2016-05-09,7370.017398852801 +155,HOUSEHOLD_1,2016-05-10,6703.274498285182 +156,HOUSEHOLD_1,2016-05-11,6599.658566441017 +157,HOUSEHOLD_1,2016-05-12,6803.892952779315 +158,HOUSEHOLD_1,2016-05-13,7578.147413631544 +159,HOUSEHOLD_1,2016-05-14,9797.63840894531 +160,HOUSEHOLD_1,2016-05-15,9618.004359773748 +161,HOUSEHOLD_1,2016-05-16,7369.325267410535 +162,HOUSEHOLD_1,2016-05-17,6704.177617699504 +163,HOUSEHOLD_1,2016-05-18,6602.321156728928 +164,HOUSEHOLD_1,2016-05-19,6806.125635799577 +165,HOUSEHOLD_1,2016-05-20,7579.715540310798 +166,HOUSEHOLD_1,2016-05-21,9800.535564906138 +167,HOUSEHOLD_1,2016-05-22,9618.816928719863 
+168,HOUSEHOLD_2,2016-04-25,1944.6365790975688 +169,HOUSEHOLD_2,2016-04-26,1782.1136284351692 +170,HOUSEHOLD_2,2016-04-27,1783.3160335243492 +171,HOUSEHOLD_2,2016-04-28,1843.7479525740052 +172,HOUSEHOLD_2,2016-04-29,2017.7306193648328 +173,HOUSEHOLD_2,2016-04-30,2573.4319970333827 +174,HOUSEHOLD_2,2016-05-01,2555.781560345023 +175,HOUSEHOLD_2,2016-05-02,1911.5887343314832 +176,HOUSEHOLD_2,2016-05-03,1773.6009268551322 +177,HOUSEHOLD_2,2016-05-04,1783.737933427243 +178,HOUSEHOLD_2,2016-05-05,1836.4433591054317 +179,HOUSEHOLD_2,2016-05-06,2026.2345730343163 +180,HOUSEHOLD_2,2016-05-07,2599.273470339867 +181,HOUSEHOLD_2,2016-05-08,2547.324959977864 +182,HOUSEHOLD_2,2016-05-09,1919.6860442557204 +183,HOUSEHOLD_2,2016-05-10,1772.1267493740079 +184,HOUSEHOLD_2,2016-05-11,1776.2903338158771 +185,HOUSEHOLD_2,2016-05-12,1836.0676051839982 +186,HOUSEHOLD_2,2016-05-13,2012.270429155826 +187,HOUSEHOLD_2,2016-05-14,2570.3606621455087 +188,HOUSEHOLD_2,2016-05-15,2548.3296441260773 +189,HOUSEHOLD_2,2016-05-16,1906.4143149755678 +190,HOUSEHOLD_2,2016-05-17,1767.280129446266 +191,HOUSEHOLD_2,2016-05-18,1776.7401745381599 +192,HOUSEHOLD_2,2016-05-19,1830.4754939798 +193,HOUSEHOLD_2,2016-05-20,2018.588737506113 +194,HOUSEHOLD_2,2016-05-21,2589.769743131061 +195,HOUSEHOLD_2,2016-05-22,2541.838195247957 diff --git a/nbs/assets/lgbm_rst.csv b/nbs/assets/lgbm_rst.csv new file mode 100644 index 00000000..144ca90c --- /dev/null +++ b/nbs/assets/lgbm_rst.csv @@ -0,0 +1,197 @@ +,unique_id,ds,AutoLightGBM +0,FOODS_1,2016-04-25,2694.6738511439944 +1,FOODS_1,2016-04-26,2805.230420439614 +2,FOODS_1,2016-04-27,2662.0380598102083 +3,FOODS_1,2016-04-28,2645.027003376193 +4,FOODS_1,2016-04-29,3236.588718297946 +5,FOODS_1,2016-04-30,3747.51371444864 +6,FOODS_1,2016-05-01,3172.307149809725 +7,FOODS_1,2016-05-02,2657.3513449500338 +8,FOODS_1,2016-05-03,2691.9787279391626 +9,FOODS_1,2016-05-04,2746.2863197867673 +10,FOODS_1,2016-05-05,2762.255340569623 +11,FOODS_1,2016-05-06,3257.194144588295 
+12,FOODS_1,2016-05-07,3799.031472854631 +13,FOODS_1,2016-05-08,3252.8382373569984 +14,FOODS_1,2016-05-09,2786.334069555473 +15,FOODS_1,2016-05-10,2820.205574835855 +16,FOODS_1,2016-05-11,2762.5056712532564 +17,FOODS_1,2016-05-12,2786.88595237666 +18,FOODS_1,2016-05-13,3309.4905882795897 +19,FOODS_1,2016-05-14,3796.0201508972023 +20,FOODS_1,2016-05-15,3273.3752810082988 +21,FOODS_1,2016-05-16,2742.19182422212 +22,FOODS_1,2016-05-17,2823.468902301943 +23,FOODS_1,2016-05-18,2854.8557474617855 +24,FOODS_1,2016-05-19,2871.135690726362 +25,FOODS_1,2016-05-20,3331.1931287348802 +26,FOODS_1,2016-05-21,3781.1473608863216 +27,FOODS_1,2016-05-22,3405.544149448268 +28,FOODS_2,2016-04-25,5120.102523686289 +29,FOODS_2,2016-04-26,5185.27038248254 +30,FOODS_2,2016-04-27,5115.111348340718 +31,FOODS_2,2016-04-28,4619.394726238464 +32,FOODS_2,2016-04-29,5432.537671232106 +33,FOODS_2,2016-04-30,6025.41273018486 +34,FOODS_2,2016-05-01,6220.986523247984 +35,FOODS_2,2016-05-02,4964.5749171463885 +36,FOODS_2,2016-05-03,5103.670724855448 +37,FOODS_2,2016-05-04,5144.3979512523165 +38,FOODS_2,2016-05-05,5218.996763184711 +39,FOODS_2,2016-05-06,5439.347347215497 +40,FOODS_2,2016-05-07,5865.1687497733365 +41,FOODS_2,2016-05-08,6368.92258946046 +42,FOODS_2,2016-05-09,5186.848082254273 +43,FOODS_2,2016-05-10,4880.374441261076 +44,FOODS_2,2016-05-11,4909.098152984957 +45,FOODS_2,2016-05-12,5081.108905626409 +46,FOODS_2,2016-05-13,5407.15017000438 +47,FOODS_2,2016-05-14,5830.236827339688 +48,FOODS_2,2016-05-15,6618.276011160659 +49,FOODS_2,2016-05-16,5242.077035682606 +50,FOODS_2,2016-05-17,5003.983891141501 +51,FOODS_2,2016-05-18,4958.840167821236 +52,FOODS_2,2016-05-19,4762.949855746844 +53,FOODS_2,2016-05-20,5389.750344472496 +54,FOODS_2,2016-05-21,5942.651453698519 +55,FOODS_2,2016-05-22,6269.243619511553 +56,FOODS_3,2016-04-25,17711.385739545563 +57,FOODS_3,2016-04-26,16357.865618151673 +58,FOODS_3,2016-04-27,16557.86563355973 +59,FOODS_3,2016-04-28,16163.752858976526 
+60,FOODS_3,2016-04-29,18881.115214451296 +61,FOODS_3,2016-04-30,23092.123636884276 +62,FOODS_3,2016-05-01,23294.58207237022 +63,FOODS_3,2016-05-02,17732.312728761386 +64,FOODS_3,2016-05-03,16215.758103512571 +65,FOODS_3,2016-05-04,16609.186712046285 +66,FOODS_3,2016-05-05,17115.71866090232 +67,FOODS_3,2016-05-06,18163.574602023327 +68,FOODS_3,2016-05-07,22698.015289239014 +69,FOODS_3,2016-05-08,22955.84590815469 +70,FOODS_3,2016-05-09,17924.510549950868 +71,FOODS_3,2016-05-10,16652.368043668524 +72,FOODS_3,2016-05-11,16706.713769910348 +73,FOODS_3,2016-05-12,17070.997700996042 +74,FOODS_3,2016-05-13,18438.390974654023 +75,FOODS_3,2016-05-14,22698.015289239014 +76,FOODS_3,2016-05-15,22955.84590815469 +77,FOODS_3,2016-05-16,18333.211272508892 +78,FOODS_3,2016-05-17,16812.741370928095 +79,FOODS_3,2016-05-18,16706.713769910348 +80,FOODS_3,2016-05-19,16479.679299243857 +81,FOODS_3,2016-05-20,18502.532285923797 +82,FOODS_3,2016-05-21,22698.015289239014 +83,FOODS_3,2016-05-22,22955.84590815469 +84,HOBBIES_1,2016-04-25,3226.027840439743 +85,HOBBIES_1,2016-04-26,3195.3648189304345 +86,HOBBIES_1,2016-04-27,3172.479599244583 +87,HOBBIES_1,2016-04-28,3215.297092249357 +88,HOBBIES_1,2016-04-29,3550.478555688749 +89,HOBBIES_1,2016-04-30,4315.818469198181 +90,HOBBIES_1,2016-05-01,4321.600390227421 +91,HOBBIES_1,2016-05-02,3157.8276654934016 +92,HOBBIES_1,2016-05-03,3208.8238007824716 +93,HOBBIES_1,2016-05-04,3171.402461945512 +94,HOBBIES_1,2016-05-05,3122.93302254743 +95,HOBBIES_1,2016-05-06,3534.892640584684 +96,HOBBIES_1,2016-05-07,4261.123354991392 +97,HOBBIES_1,2016-05-08,4296.069679132532 +98,HOBBIES_1,2016-05-09,3273.3972145241705 +99,HOBBIES_1,2016-05-10,3221.5792680507666 +100,HOBBIES_1,2016-05-11,3200.345723427872 +101,HOBBIES_1,2016-05-12,3245.4991334325614 +102,HOBBIES_1,2016-05-13,3568.3027303655 +103,HOBBIES_1,2016-05-14,4320.567307842713 +104,HOBBIES_1,2016-05-15,4343.116200412291 +105,HOBBIES_1,2016-05-16,3289.762766694878 
+106,HOBBIES_1,2016-05-17,3267.984449690506 +107,HOBBIES_1,2016-05-18,3200.345723427872 +108,HOBBIES_1,2016-05-19,3208.1360951146366 +109,HOBBIES_1,2016-05-20,3615.44813501723 +110,HOBBIES_1,2016-05-21,4326.047999208027 +111,HOBBIES_1,2016-05-22,4344.900175442336 +112,HOBBIES_2,2016-04-25,339.77407251192693 +113,HOBBIES_2,2016-04-26,397.4010613540528 +114,HOBBIES_2,2016-04-27,382.61025056378617 +115,HOBBIES_2,2016-04-28,393.55441552694975 +116,HOBBIES_2,2016-04-29,412.81304016665115 +117,HOBBIES_2,2016-04-30,416.1985117603962 +118,HOBBIES_2,2016-05-01,467.8505902120062 +119,HOBBIES_2,2016-05-02,359.72499730411994 +120,HOBBIES_2,2016-05-03,400.9547760594411 +121,HOBBIES_2,2016-05-04,384.0621884160096 +122,HOBBIES_2,2016-05-05,384.0621884160096 +123,HOBBIES_2,2016-05-06,412.81304016665115 +124,HOBBIES_2,2016-05-07,405.2543467972324 +125,HOBBIES_2,2016-05-08,467.8505902120062 +126,HOBBIES_2,2016-05-09,380.6591071937099 +127,HOBBIES_2,2016-05-10,400.9547760594411 +128,HOBBIES_2,2016-05-11,400.9547760594411 +129,HOBBIES_2,2016-05-12,400.9547760594411 +130,HOBBIES_2,2016-05-13,412.81304016665115 +131,HOBBIES_2,2016-05-14,416.1985117603962 +132,HOBBIES_2,2016-05-15,467.8505902120062 +133,HOBBIES_2,2016-05-16,390.6243107525114 +134,HOBBIES_2,2016-05-17,411.89894102260484 +135,HOBBIES_2,2016-05-18,400.9547760594411 +136,HOBBIES_2,2016-05-19,400.9547760594411 +137,HOBBIES_2,2016-05-20,412.81304016665115 +138,HOBBIES_2,2016-05-21,416.1985117603962 +139,HOBBIES_2,2016-05-22,467.8505902120062 +140,HOUSEHOLD_1,2016-04-25,7160.832175743806 +141,HOUSEHOLD_1,2016-04-26,6971.744965808053 +142,HOUSEHOLD_1,2016-04-27,6676.608231213473 +143,HOUSEHOLD_1,2016-04-28,6640.7455196004885 +144,HOUSEHOLD_1,2016-04-29,7565.152447398786 +145,HOUSEHOLD_1,2016-04-30,9465.935601433835 +146,HOUSEHOLD_1,2016-05-01,9702.66861697589 +147,HOUSEHOLD_1,2016-05-02,7205.825513464553 +148,HOUSEHOLD_1,2016-05-03,7113.679030081171 +149,HOUSEHOLD_1,2016-05-04,6649.31399566832 
+150,HOUSEHOLD_1,2016-05-05,6674.348708680196 +151,HOUSEHOLD_1,2016-05-06,7697.496157413757 +152,HOUSEHOLD_1,2016-05-07,9399.00971175823 +153,HOUSEHOLD_1,2016-05-08,9439.07736476184 +154,HOUSEHOLD_1,2016-05-09,7493.79860897777 +155,HOUSEHOLD_1,2016-05-10,7002.1844984992185 +156,HOUSEHOLD_1,2016-05-11,6661.775405589411 +157,HOUSEHOLD_1,2016-05-12,6764.480000367033 +158,HOUSEHOLD_1,2016-05-13,7598.947495707824 +159,HOUSEHOLD_1,2016-05-14,9399.00971175823 +160,HOUSEHOLD_1,2016-05-15,9439.07736476184 +161,HOUSEHOLD_1,2016-05-16,7534.459703980786 +162,HOUSEHOLD_1,2016-05-17,7229.353310975897 +163,HOUSEHOLD_1,2016-05-18,6699.882771137218 +164,HOUSEHOLD_1,2016-05-19,6764.480000367033 +165,HOUSEHOLD_1,2016-05-20,7697.496157413757 +166,HOUSEHOLD_1,2016-05-21,9399.00971175823 +167,HOUSEHOLD_1,2016-05-22,9314.773035693921 +168,HOUSEHOLD_2,2016-04-25,1891.769292418806 +169,HOUSEHOLD_2,2016-04-26,1805.813605315031 +170,HOUSEHOLD_2,2016-04-27,1758.0613497523343 +171,HOUSEHOLD_2,2016-04-28,1800.1115326528136 +172,HOUSEHOLD_2,2016-04-29,1959.4740469519804 +173,HOUSEHOLD_2,2016-04-30,2660.449142902388 +174,HOUSEHOLD_2,2016-05-01,2619.654508404448 +175,HOUSEHOLD_2,2016-05-02,1839.0080089551213 +176,HOUSEHOLD_2,2016-05-03,1829.4970368277027 +177,HOUSEHOLD_2,2016-05-04,1823.5007626046254 +178,HOUSEHOLD_2,2016-05-05,1811.520891959066 +179,HOUSEHOLD_2,2016-05-06,1977.7038269928182 +180,HOUSEHOLD_2,2016-05-07,2816.242000429492 +181,HOUSEHOLD_2,2016-05-08,2634.914005288675 +182,HOUSEHOLD_2,2016-05-09,1878.4366945999661 +183,HOUSEHOLD_2,2016-05-10,1815.8433855980848 +184,HOUSEHOLD_2,2016-05-11,1811.1689759986775 +185,HOUSEHOLD_2,2016-05-12,1811.520891959066 +186,HOUSEHOLD_2,2016-05-13,1977.7038269928182 +187,HOUSEHOLD_2,2016-05-14,2753.4834680201943 +188,HOUSEHOLD_2,2016-05-15,2586.938159190155 +189,HOUSEHOLD_2,2016-05-16,1857.353491565642 +190,HOUSEHOLD_2,2016-05-17,1829.4970368277027 +191,HOUSEHOLD_2,2016-05-18,1811.520891959066 +192,HOUSEHOLD_2,2016-05-19,1811.520891959066 
+193,HOUSEHOLD_2,2016-05-20,1977.7038269928182 +194,HOUSEHOLD_2,2016-05-21,2861.6326484548927 +195,HOUSEHOLD_2,2016-05-22,2645.9665234893946 diff --git a/nbs/assets/nhits_rst.csv b/nbs/assets/nhits_rst.csv new file mode 100644 index 00000000..99e3f9d1 --- /dev/null +++ b/nbs/assets/nhits_rst.csv @@ -0,0 +1,197 @@ +unique_id,ds,NHITS +FOODS_1,2016-04-25,2504.762 +FOODS_1,2016-04-26,2467.719 +FOODS_1,2016-04-27,2430.538 +FOODS_1,2016-04-28,2545.7861 +FOODS_1,2016-04-29,3158.0547 +FOODS_1,2016-04-30,3675.847 +FOODS_1,2016-05-01,3220.2334 +FOODS_1,2016-05-02,2603.3481 +FOODS_1,2016-05-03,2549.2483 +FOODS_1,2016-05-04,2526.7446 +FOODS_1,2016-05-05,2656.253 +FOODS_1,2016-05-06,3305.013 +FOODS_1,2016-05-07,3765.003 +FOODS_1,2016-05-08,3275.3057 +FOODS_1,2016-05-09,2697.433 +FOODS_1,2016-05-10,2621.8018 +FOODS_1,2016-05-11,2528.0818 +FOODS_1,2016-05-12,2711.9429 +FOODS_1,2016-05-13,3265.7722 +FOODS_1,2016-05-14,3737.7068 +FOODS_1,2016-05-15,3250.004 +FOODS_1,2016-05-16,2663.8232 +FOODS_1,2016-05-17,2565.505 +FOODS_1,2016-05-18,2516.273 +FOODS_1,2016-05-19,2611.7502 +FOODS_1,2016-05-20,3218.6646 +FOODS_1,2016-05-21,3715.1863 +FOODS_1,2016-05-22,3209.3425 +FOODS_2,2016-04-25,5217.8647 +FOODS_2,2016-04-26,4537.3613 +FOODS_2,2016-04-27,4325.717 +FOODS_2,2016-04-28,4522.6455 +FOODS_2,2016-04-29,5086.342 +FOODS_2,2016-04-30,6492.3867 +FOODS_2,2016-05-01,7200.9097 +FOODS_2,2016-05-02,6160.0244 +FOODS_2,2016-05-03,5388.8823 +FOODS_2,2016-05-04,5440.1694 +FOODS_2,2016-05-05,5520.1226 +FOODS_2,2016-05-06,6055.701 +FOODS_2,2016-05-07,7401.1245 +FOODS_2,2016-05-08,7905.652 +FOODS_2,2016-05-09,6759.285 +FOODS_2,2016-05-10,5789.94 +FOODS_2,2016-05-11,5636.6777 +FOODS_2,2016-05-12,5507.3813 +FOODS_2,2016-05-13,5849.2007 +FOODS_2,2016-05-14,7064.666 +FOODS_2,2016-05-15,7434.761 +FOODS_2,2016-05-16,6070.2705 +FOODS_2,2016-05-17,5095.434 +FOODS_2,2016-05-18,4870.112 +FOODS_2,2016-05-19,4596.719 +FOODS_2,2016-05-20,4982.272 +FOODS_2,2016-05-21,6231.084 +FOODS_2,2016-05-22,6697.241 
+FOODS_3,2016-04-25,17230.807 +FOODS_3,2016-04-26,15789.233 +FOODS_3,2016-04-27,15369.597 +FOODS_3,2016-04-28,15617.65 +FOODS_3,2016-04-29,18008.902 +FOODS_3,2016-04-30,23040.523 +FOODS_3,2016-05-01,23571.592 +FOODS_3,2016-05-02,18340.871 +FOODS_3,2016-05-03,16562.752 +FOODS_3,2016-05-04,16747.717 +FOODS_3,2016-05-05,17052.62 +FOODS_3,2016-05-06,19778.832 +FOODS_3,2016-05-07,24705.719 +FOODS_3,2016-05-08,24711.145 +FOODS_3,2016-05-09,19328.555 +FOODS_3,2016-05-10,17409.87 +FOODS_3,2016-05-11,17146.104 +FOODS_3,2016-05-12,16995.588 +FOODS_3,2016-05-13,19478.918 +FOODS_3,2016-05-14,24267.672 +FOODS_3,2016-05-15,24103.676 +FOODS_3,2016-05-16,18767.125 +FOODS_3,2016-05-17,16687.102 +FOODS_3,2016-05-18,16438.53 +FOODS_3,2016-05-19,15937.973 +FOODS_3,2016-05-20,18391.8 +FOODS_3,2016-05-21,23098.781 +FOODS_3,2016-05-22,23017.9 +HOBBIES_1,2016-04-25,3293.069 +HOBBIES_1,2016-04-26,3175.8167 +HOBBIES_1,2016-04-27,3104.7383 +HOBBIES_1,2016-04-28,3130.194 +HOBBIES_1,2016-04-29,3652.3372 +HOBBIES_1,2016-04-30,4440.7046 +HOBBIES_1,2016-05-01,4260.2666 +HOBBIES_1,2016-05-02,3375.5198 +HOBBIES_1,2016-05-03,3186.3364 +HOBBIES_1,2016-05-04,3148.969 +HOBBIES_1,2016-05-05,3190.6125 +HOBBIES_1,2016-05-06,3787.1 +HOBBIES_1,2016-05-07,4503.3115 +HOBBIES_1,2016-05-08,4216.017 +HOBBIES_1,2016-05-09,3309.7373 +HOBBIES_1,2016-05-10,3130.4082 +HOBBIES_1,2016-05-11,3052.7866 +HOBBIES_1,2016-05-12,3083.465 +HOBBIES_1,2016-05-13,3624.693 +HOBBIES_1,2016-05-14,4420.6533 +HOBBIES_1,2016-05-15,4138.2466 +HOBBIES_1,2016-05-16,3327.1152 +HOBBIES_1,2016-05-17,3115.9226 +HOBBIES_1,2016-05-18,3068.1096 +HOBBIES_1,2016-05-19,3066.814 +HOBBIES_1,2016-05-20,3670.4724 +HOBBIES_1,2016-05-21,4458.9883 +HOBBIES_1,2016-05-22,4195.486 +HOBBIES_2,2016-04-25,359.69662 +HOBBIES_2,2016-04-26,337.56714 +HOBBIES_2,2016-04-27,336.36066 +HOBBIES_2,2016-04-28,346.82523 +HOBBIES_2,2016-04-29,385.13193 +HOBBIES_2,2016-04-30,448.0414 +HOBBIES_2,2016-05-01,428.58112 +HOBBIES_2,2016-05-02,347.9329 
+HOBBIES_2,2016-05-03,325.00256 +HOBBIES_2,2016-05-04,332.32742 +HOBBIES_2,2016-05-05,348.48566 +HOBBIES_2,2016-05-06,397.46094 +HOBBIES_2,2016-05-07,463.35196 +HOBBIES_2,2016-05-08,445.56622 +HOBBIES_2,2016-05-09,360.51288 +HOBBIES_2,2016-05-10,336.52014 +HOBBIES_2,2016-05-11,344.28247 +HOBBIES_2,2016-05-12,358.7079 +HOBBIES_2,2016-05-13,409.6697 +HOBBIES_2,2016-05-14,475.46484 +HOBBIES_2,2016-05-15,455.52716 +HOBBIES_2,2016-05-16,381.3134 +HOBBIES_2,2016-05-17,355.26096 +HOBBIES_2,2016-05-18,351.80453 +HOBBIES_2,2016-05-19,363.197 +HOBBIES_2,2016-05-20,404.1736 +HOBBIES_2,2016-05-21,471.72308 +HOBBIES_2,2016-05-22,452.07477 +HOUSEHOLD_1,2016-04-25,7322.5625 +HOUSEHOLD_1,2016-04-26,6919.1865 +HOUSEHOLD_1,2016-04-27,6807.973 +HOUSEHOLD_1,2016-04-28,6930.8086 +HOUSEHOLD_1,2016-04-29,8116.5 +HOUSEHOLD_1,2016-04-30,10300.233 +HOUSEHOLD_1,2016-05-01,10267.285 +HOUSEHOLD_1,2016-05-02,7921.134 +HOUSEHOLD_1,2016-05-03,7284.6235 +HOUSEHOLD_1,2016-05-04,7280.303 +HOUSEHOLD_1,2016-05-05,7267.668 +HOUSEHOLD_1,2016-05-06,8540.003 +HOUSEHOLD_1,2016-05-07,10456.705 +HOUSEHOLD_1,2016-05-08,10088.888 +HOUSEHOLD_1,2016-05-09,7604.306 +HOUSEHOLD_1,2016-05-10,6985.8867 +HOUSEHOLD_1,2016-05-11,6745.779 +HOUSEHOLD_1,2016-05-12,6693.4326 +HOUSEHOLD_1,2016-05-13,7825.8516 +HOUSEHOLD_1,2016-05-14,9895.505 +HOUSEHOLD_1,2016-05-15,9434.72 +HOUSEHOLD_1,2016-05-16,7175.374 +HOUSEHOLD_1,2016-05-17,6486.9434 +HOUSEHOLD_1,2016-05-18,6495.8496 +HOUSEHOLD_1,2016-05-19,6345.693 +HOUSEHOLD_1,2016-05-20,7672.4624 +HOUSEHOLD_1,2016-05-21,9825.944 +HOUSEHOLD_1,2016-05-22,9556.082 +HOUSEHOLD_2,2016-04-25,1931.113 +HOUSEHOLD_2,2016-04-26,1782.4025 +HOUSEHOLD_2,2016-04-27,1758.2009 +HOUSEHOLD_2,2016-04-28,1763.3115 +HOUSEHOLD_2,2016-04-29,2031.7482 +HOUSEHOLD_2,2016-04-30,2627.6375 +HOUSEHOLD_2,2016-05-01,2618.0635 +HOUSEHOLD_2,2016-05-02,1939.3312 +HOUSEHOLD_2,2016-05-03,1775.9213 +HOUSEHOLD_2,2016-05-04,1784.6147 +HOUSEHOLD_2,2016-05-05,1768.6473 +HOUSEHOLD_2,2016-05-06,2086.8005 
+HOUSEHOLD_2,2016-05-07,2645.3496 +HOUSEHOLD_2,2016-05-08,2584.8975 +HOUSEHOLD_2,2016-05-09,1910.047 +HOUSEHOLD_2,2016-05-10,1752.4678 +HOUSEHOLD_2,2016-05-11,1736.5 +HOUSEHOLD_2,2016-05-12,1733.4746 +HOUSEHOLD_2,2016-05-13,2037.8102 +HOUSEHOLD_2,2016-05-14,2586.608 +HOUSEHOLD_2,2016-05-15,2516.9414 +HOUSEHOLD_2,2016-05-16,1902.0074 +HOUSEHOLD_2,2016-05-17,1732.1702 +HOUSEHOLD_2,2016-05-18,1742.648 +HOUSEHOLD_2,2016-05-19,1724.6858 +HOUSEHOLD_2,2016-05-20,2035.2493 +HOUSEHOLD_2,2016-05-21,2608.6196 +HOUSEHOLD_2,2016-05-22,2549.3857 diff --git a/nbs/docs/getting-started/7_why_timegpt.ipynb b/nbs/docs/getting-started/7_why_timegpt.ipynb new file mode 100644 index 00000000..9b3c7f08 --- /dev/null +++ b/nbs/docs/getting-started/7_why_timegpt.ipynb @@ -0,0 +1,888 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide\n", + "!pip install -Uqq nixtla" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/yibeihu/opt/anaconda3/envs/report/lib/python3.9/site-packages/dask/dataframe/__init__.py:42: FutureWarning: \n", + "Dask dataframe query planning is disabled because dask-expr is not installed.\n", + "\n", + "You can install it with `pip install dask[dataframe]` or `conda install dask`.\n", + "This will raise in a future version.\n", + "\n", + " warnings.warn(msg, FutureWarning)\n" + ] + } + ], + "source": [ + "#| hide \n", + "from nixtla.utils import in_colab" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide \n", + "IN_COLAB = in_colab()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide\n", + "if not IN_COLAB:\n", + " from nixtla.utils import colab_badge\n", + " from dotenv import load_dotenv" + ] + }, + { + "cell_type": "markdown", + 
"metadata": {}, + "source": [ + "# Why TimeGPT?" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this notebook, we compare the performance of TimeGPT against three forecasting models: the classical model (ARIMA), the machine learning model (LightGBM), and the deep learning model (N-HiTS), using a subset of data from the M5 Forecasting competition. We want to highlight three top-rated benefits our users love about TimeGPT:\n", + "\n", + "🎯 **Accuracy**: TimeGPT consistently outperforms traditional models by capturing complex patterns with precision.\n", + "\n", + "⚑ **Speed**: Generate forecasts faster without needing extensive training or tuning for each series.\n", + "\n", + "πŸš€ **Ease of Use**: Minimal setup and no complex preprocessing make TimeGPT accessible and ready to use right out of the box!\n", + "\n", + "Before diving into the notebook, please visit our [dashboard](https://dashboard.nixtla.io) to generate your TimeGPT `api_key` and give it a try yourself!" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Table of Contents\n", + "\n", + "1. [Data Introduction](#data-introduction)\n", + "2. [Model Fitting](#model-fitting-timegpt-arima-lgbregressor-n-hits)\n", + " 1. [Fitting Time GPT](#timegpt)\n", + " 2. [Fitting ARIMA](#classical-models-arima)\n", + " 3. [Fitting Light GBM](#machine-learning-models-lgbmregressor)\n", + " 4. [Fitting NHITS](#n-hits)\n", + "3. [Results and Evaluation](#performance-comparison-and-results)\n", + "4. 
[Conclusion](#conclusion)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "[![](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/Nixtla/nixtla/blob/main/nbs/docs/getting-started/7_why_timegpt.ipynb)" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "#| echo: false\n", + "if not IN_COLAB:\n", + " load_dotenv()\n", + " colab_badge('docs/getting-started/7_why_timegpt')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "\n", + "from nixtla import NixtlaClient\n", + "from utilsforecast.plotting import plot_series\n", + "from utilsforecast.losses import mae, rmse, smape\n", + "from utilsforecast.evaluation import evaluate" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "nixtla_client = NixtlaClient(\n", + " # api_key = 'my_api_key_provided_by_nixtla'\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Data introduction" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this notebook, we’re working with an aggregated dataset from the M5 Forecasting - Accuracy competition. This dataset includes **7 daily time series**, each with **1,941 data points**. The last **28 data points** of each series are set aside as the test set, allowing us to evaluate model performance on unseen data." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_csv('https://datasets-nixtla.s3.amazonaws.com/demand_example.csv', parse_dates=['ds'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
dsy
minmaxcountminmeanmedianmax
unique_id
FOODS_12011-01-292016-05-2219410.02674.0855232665.05493.0
FOODS_22011-01-292016-05-2219410.04015.9840293894.09069.0
FOODS_32011-01-292016-05-22194110.016969.08912916548.028663.0
HOBBIES_12011-01-292016-05-2219410.02936.1226172908.05009.0
HOBBIES_22011-01-292016-05-2219410.0279.053065248.0871.0
HOUSEHOLD_12011-01-292016-05-2219410.06039.5945395984.011106.0
HOUSEHOLD_22011-01-292016-05-2219410.01566.8402891520.02926.0
\n", + "
" + ], + "text/plain": [ + " ds y \n", + " min max count min mean median max\n", + "unique_id \n", + "FOODS_1 2011-01-29 2016-05-22 1941 0.0 2674.085523 2665.0 5493.0\n", + "FOODS_2 2011-01-29 2016-05-22 1941 0.0 4015.984029 3894.0 9069.0\n", + "FOODS_3 2011-01-29 2016-05-22 1941 10.0 16969.089129 16548.0 28663.0\n", + "HOBBIES_1 2011-01-29 2016-05-22 1941 0.0 2936.122617 2908.0 5009.0\n", + "HOBBIES_2 2011-01-29 2016-05-22 1941 0.0 279.053065 248.0 871.0\n", + "HOUSEHOLD_1 2011-01-29 2016-05-22 1941 0.0 6039.594539 5984.0 11106.0\n", + "HOUSEHOLD_2 2011-01-29 2016-05-22 1941 0.0 1566.840289 1520.0 2926.0" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.groupby('unique_id').agg({\"ds\":[\"min\",\"max\",\"count\"],\\\n", + " \"y\":[\"min\",\"mean\",\"median\",\"max\"]})" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "(13391, 3) (196, 3)\n" + ] + } + ], + "source": [ + "df_train = df.query('ds <= \"2016-04-24\"')\n", + "df_test = df.query('ds > \"2016-04-24\"')\n", + "\n", + "print(df_train.shape, df_test.shape)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. Model Fitting (TimeGPT, ARIMA, LightGBM, N-HiTS)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.1 TimeGPT\n", + "TimeGPT offers a powerful, streamlined solution for time series forecasting, delivering state-of-the-art results with minimal effort. 
With TimeGPT, there's no need for data preprocessing or feature engineering -- simply initiate the Nixtla client and call `nixtla_client.forecast` to produce accurate, high-performance forecasts tailored to your unique time series.\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "INFO:nixtla.nixtla_client:Validating inputs...\n", + "INFO:nixtla.nixtla_client:Inferred freq: D\n", + "INFO:nixtla.nixtla_client:Querying model metadata...\n", + "INFO:nixtla.nixtla_client:Preprocessing dataframes...\n", + "INFO:nixtla.nixtla_client:Calling Forecast Endpoint...\n" + ] + } + ], + "source": [ + "# Forecast with TimeGPT\n", + "fcst_timegpt = nixtla_client.forecast(df = df_train,\n", + " target_col = 'y', \n", + " h=28, # Forecast horizon, predicts the next 28 time steps\n", + " model='timegpt-1-long-horizon', # Use the model for long-horizon forecasting\n", + " finetune_steps=10, # Number of finetuning steps\n", + " level = [90]) # Generate a 90% confidence interval" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "metric\n", + "rmse 592.607378\n", + "smape 0.049403\n", + "Name: TimeGPT, dtype: float64" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Evaluate performance and plot forecast\n", + "fcst_timegpt['ds'] = pd.to_datetime(fcst_timegpt['ds'])\n", + "test_df = pd.merge(df_test, fcst_timegpt, 'left', ['unique_id', 'ds'])\n", + "evaluation_timegpt = evaluate(test_df, metrics=[rmse, smape], models=[\"TimeGPT\"])\n", + "evaluation_timegpt.groupby(['metric'])['TimeGPT'].mean()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.2 Classical Models (ARIMA):\n", + "Next, we applied ARIMA, a traditional statistical model, to the same forecasting task. 
Classical models use historical trends and seasonality to make predictions by relying on linear assumptions. However, they struggled to capture the complex, non-linear patterns within the data, leading to lower accuracy compared to other approaches. Additionally, ARIMA was slower due to its iterative parameter estimation process, which becomes computationally intensive for larger datasets." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "> 📘 Why Use TimeGPT over Classical Models?\n", + ">\n", + "> * **Complex Patterns**: TimeGPT captures non-linear trends classical models miss.\n", + ">\n", + "> * **Minimal Preprocessing**: TimeGPT requires little to no data preparation.\n", + ">\n", + "> * **Scalability**: TimeGPT scales efficiently across multiple series without retraining." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "from statsforecast import StatsForecast\n", + "from statsforecast.models import AutoARIMA" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "#Initiate ARIMA model\n", + "sf = StatsForecast(\n", + " models=[AutoARIMA(season_length=7)],\n", + " freq='D'\n", + ")\n", + "# Fit and forecast\n", + "fcst_arima = sf.forecast(h=28, df=df_train) " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide\n", + "fcst_arima = pd.read_csv('../../assets/arima_rst.csv', parse_dates=['ds'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "metric\n", + "rmse 724.957364\n", + "smape 0.055018\n", + "Name: AutoARIMA, dtype: float64" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "fcst_arima.reset_index(inplace=True)\n", + "test_df = 
pd.merge(df_test, fcst_arima, 'left', ['unique_id', 'ds'])\n", + "evaluation_arima = evaluate(test_df, metrics=[rmse, smape], models=[\"AutoARIMA\"])\n", + "evaluation_arima.groupby(['metric'])['AutoARIMA'].mean()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.3 Machine Learning Models (LightGBM)\n", + "\n", + "Thirdly, we used a machine learning model, LightGBM, for the same forecasting task, implemented through the automated pipeline provided by our mlforecast library.\n", + "While LightGBM can capture seasonality and patterns, achieving the best performance often requires detailed feature engineering, careful hyperparameter tuning, and domain knowledge. You can try our mlforecast library to simplify this process and get started quickly!" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "> 📘 Why Use TimeGPT over Machine Learning Models?\n", + ">\n", + "> * **Automatic Pattern Recognition**: Captures complex patterns from raw data, bypassing the need for feature engineering.\n", + ">\n", + "> * **Minimal Tuning**: Works well without extensive tuning.\n", + ">\n", + "> * **Scalability**: Forecasts across multiple series without retraining." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "import optuna\n", + "from mlforecast.auto import AutoMLForecast, AutoLightGBM\n", + "\n", + "# Suppress Optuna's logging output\n", + "optuna.logging.set_verbosity(optuna.logging.ERROR)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "# Initialize an automated forecasting pipeline using AutoMLForecast.\n", + "mlf = AutoMLForecast(\n", + " models=[AutoLightGBM()],\n", + " freq='D',\n", + " season_length=7, \n", + " fit_config=lambda trial: {'static_features': ['unique_id']}\n", + ")\n", + "\n", + "# Fit the model to the training dataset.\n", + "mlf.fit(\n", + " df=df_train.astype({'unique_id': 'category'}),\n", + " n_windows=1,\n", + " h=28,\n", + " num_samples=10,\n", + ")\n", + "fcst_lgbm = mlf.predict(28)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide\n", + "fcst_lgbm = pd.read_csv('../../assets/lgbm_rst.csv', parse_dates=['ds'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "metric\n", + "rmse 687.773744\n", + "smape 0.051448\n", + "Name: AutoLightGBM, dtype: float64" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "test_df = pd.merge(df_test, fcst_lgbm, 'left', ['unique_id', 'ds'])\n", + "evaluation_lgbm = evaluate(test_df, metrics=[rmse, smape], models=[\"AutoLightGBM\"])\n", + "evaluation_lgbm.groupby(['metric'])['AutoLightGBM'].mean()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### 2.4 N-HiTS\n", + "\n", + "Lastly, we used N-HiTS, a state-of-the-art deep learning model designed for time series forecasting. 
The model produced accurate results, demonstrating its ability to capture complex, non-linear patterns within the data. However, setting up and tuning N-HiTS required significantly more time and computational resources compared to TimeGPT." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "> 📘 Why Use TimeGPT Over Deep Learning Models?\n", + ">\n", + "> * **Faster Setup**: Quick setup and forecasting, unlike the lengthy configuration and training times of neural networks.\n", + ">\n", + "> * **Less Tuning**: Performs well with minimal tuning and preprocessing, while neural networks often need extensive adjustments.\n", + ">\n", + "> * **Ease of Use**: Simple deployment with high accuracy, making it accessible without deep technical expertise." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "from neuralforecast.core import NeuralForecast\n", + "from neuralforecast.models import NHITS" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| eval: false\n", + "# Initialize the N-HiTS model.\n", + "models = [NHITS(h=28, \n", + " input_size=28, \n", + " max_steps=100)]\n", + "\n", + "# Fit the model using training data\n", + "nf = NeuralForecast(models=models, freq='D')\n", + "nf.fit(df=df_train)\n", + "fcst_nhits = nf.predict()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| hide\n", + "fcst_nhits = pd.read_csv('../../assets/nhits_rst.csv', parse_dates=['ds'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "metric\n", + "rmse 605.011948\n", + "smape 0.053446\n", + "Name: NHITS, dtype: float64" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "test_df = 
pd.merge(df_test,fcst_nhits, 'left', ['unique_id', 'ds'])\n", + "evaluation_nhits = evaluate(test_df, metrics=[rmse, smape], models=[\"NHITS\"])\n", + "evaluation_nhits.groupby(['metric'])['NHITS'].mean()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 3. Performance Comparison and Results:\n", + "The performance of each model is evaluated using RMSE (Root Mean Squared Error) and SMAPE (Symmetric Mean Absolute Percentage Error). While RMSE emphasizes the models’ ability to control significant errors, SMAPE provides a relative performance perspective by normalizing errors as percentages. Below, we present a snapshot of performance across all groups. The results demonstrate that TimeGPT outperforms other models on both metrics.\n", + "\n", + "🌟 For a deeper dive into benchmarking, check out our benchmark repository. The summarized results are displayed below:" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Overall Performance Metrics\n", + "\n", + "| **Model** | **RMSE** | **SMAPE** |\n", + "|------------------|----------|-----------|\n", + "| ARIMA | 725.0 | 5.50% |\n", + "| LightGBM | 687.8 | 5.14% |\n", + "| N-HiTS | 605.0 | 5.34% |\n", + "| **TimeGPT** | **592.6**| **4.94%** |\n", + " \n", + "\n", + "#### Breakdown for Each Time-series\n", + "Below are the metrics for each individual time series group. TimeGPT consistently delivers accurate forecasts across all time series groups. In many cases, it performs as well as or better than data-specific models, showing its versatility and reliability across different datasets." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "#| echo: false\n", + "evaluation_df = evaluation_arima.merge(evaluation_lgbm, on = ['unique_id','metric'], how = 'left')\\\n", + " .merge(evaluation_nhits, on = ['unique_id','metric'], how = 'left')\\\n", + " .merge(evaluation_timegpt, on = ['unique_id','metric'], how = 'left')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# | echo: false\n", + "colors = [\n", + " (\"#A9B9C3\", 0.5), # Grey-bluish color 1\n", + " (\"#7A8D9D\", 0.5), # Grey-bluish color 2\n", + " (\"#5B6D79\", 0.5), # Grey-bluish color 3\n", + " ('#F95D6A', 0.75) # Green color for the last\n", + "]\n", + "\n", + "\n", + "# Filter evaluation data by metric and set unique_id as index\n", + "rmse_df = evaluation_df[evaluation_df['metric'] == 'rmse'].set_index('unique_id')\n", + "smape_df = evaluation_df[evaluation_df['metric'] == 'smape'].set_index('unique_id')\n", + "\n", + "# Plot function with custom colors and opacity\n", + "def plot_metric(ax, df, title, ylabel):\n", + " x = np.arange(len(df))\n", + " bar_width = 0.2\n", + " for i, (col, (color, alpha)) in enumerate(zip(df.columns[1:], colors)):\n", + " ax.bar(x + i * bar_width, df[col], width=bar_width, label=col, color=color, alpha=alpha)\n", + " ax.set(title=title, ylabel=ylabel, xticks=x + bar_width * (len(df.columns[1:]) - 1) / 2, xticklabels=df.index)\n", + " ax.tick_params(axis='x', rotation=45)\n", + " ax.legend()\n", + "\n", + "# Generate side-by-side plots for RMSE and SMAPE\n", + "fig, axes = plt.subplots(1, 2, figsize=(14, 6))\n", + "plot_metric(axes[0], rmse_df, \"RMSE Comparison Across Models\", \"RMSE\")\n", + "plot_metric(axes[1], smape_df*100, \"%SMAPE Comparison Across Models\", \"SMAPE\")\n", + "\n", + "plt.tight_layout()\n", + "plt.show()\n", + " " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### Benchmark Results\n", + "For a more comprehensive dive into model accuracy and performance, explore our [Time Series Model Arena](https://github.com/Nixtla/nixtla/tree/main/experiments/foundation-time-series-arena)! TimeGPT continues to lead the pack with exceptional performance across benchmarks! 
🌟\n", + "\n", + "![image](https://github.com/Nixtla/nixtla/assets/10517170/1c042591-0585-4a5b-a548-2017a28f2d4f)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 4. Conclusion\n", + "At the end of this notebook, we’ve put together a handy table to show you exactly where TimeGPT shines brightest compared to other forecasting models. β˜€οΈ Think of it as your quick guide to choosing the best model for your unique project needs. We’re confident that TimeGPT will be a valuable tool in your forecasting journey. Don’t forget to visit our [dashboard](https://dashboard.nixtla.io) to generate your TimeGPT `api_key` and get started today! Happy forecasting, and enjoy the insights ahead! " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
ScenarioTimeGPTClassical Models (e.g., ARIMA)Machine Learning Models (e.g., XGB, LGBM)Deep Learning Models (e.g., N-HITS)
Seasonal Patterns✅ Performs well with minimal setup✅ Handles seasonality with adjustments (e.g., SARIMA)✅ Performs well with feature engineering✅ Captures seasonal patterns effectively
Non-Linear Patterns✅ Excels, especially with complex non-linear patterns❌ Limited performance❌ Struggles without extensive feature engineering✅ Performs well with non-linear relationships
Large Dataset✅ Highly scalable across many series❌ Slow and resource-intensive✅ Scalable with optimized implementations❌ Requires significant resources for large datasets
Small Dataset✅ Performs well; requires only one data point to start✅ Performs well; may struggle with very sparse data✅ Performs adequately if enough features are extracted❌ May need a minimum data size to learn effectively
Preprocessing Required✅ Minimal preprocessing needed❌ Requires scaling, log-transform, etc., to meet model assumptions.❌ Requires extensive feature engineering for complex patterns❌ Needs data normalization and preprocessing
Accuracy Requirement✅ Achieves high accuracy with minimal tuning❌ May struggle with complex accuracy requirements✅ Can achieve good accuracy with tuning✅ High accuracy possible but with significant resource use
Scalability✅ Highly scalable with minimal task-specific configuration❌ Not easily scalable✅ Moderate scalability, with feature engineering and tuning per task❌ Limited scalability due to resource demands
Computational Resources✅ Highly efficient, operates seamlessly on CPU, no GPU needed✅ Light to moderate, scales poorly with large datasets❌ Moderate, depends on feature complexity❌ High resource consumption, often requires GPU
Memory Requirement✅ Efficient memory usage for large datasets✅ Moderate memory requirements❌ High memory usage for larger datasets or many series cases❌ High memory consumption for larger datasets and multiple series
Technical Requirements & Domain Knowledge✅ Low; minimal technical setup and no domain expertise needed✅ Low to moderate; needs understanding of stationarity❌ Moderate to high; requires feature engineering and tuning❌ High; complex architecture and tuning
\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "python3", + "language": "python", + "name": "python3" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +}