I have a data frame that has aggregate data over every 5 days(called a week in the dataset).
> dput(Sample3)
structure(list(Firm = c("ENG", "ENG", "ENG", "ENG", "ENG", "AUS",
"AUS", "AUS", "AUS", "AUS", "NZ", "NZ", "NZ", "NZ", "NZ"), Week = c(1,
2, 3, 4, 5, 1, 2, 3, 4, 5, 1, 2, 3, 4, 5), TotalSales = c(200,
155, 195, 150, 155, 140, 145, 150, 155, 160, 120, 125, 130, 135,
140)), class = c("tbl_df", "tbl", "data.frame"), row.names = c(NA,
-15L), .Names = c("Firm", "Week", "TotalSales"))
I want to join it with another data frame that has daily output values for three production departments AP,BG, and CK.
> dput(Sample2)
structure(list(Firm = c("ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ",
"NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ",
"NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ"), Date = structure(c(1451865600,
1451952000, 1452038400, 1452124800, 1452211200, 1452470400, 1452556800,
1452643200, 1452729600, 1452816000, 1453075200, 1453161600, 1453248000,
1453334400, 1453420800, 1453680000, 1453852800, 1453939200, 1454025600,
1454284800, 1454371200, 1454457600, 1454544000, 1454630400, 1454889600,
1454976000, 1455062400, 1451865600, 1451952000, 1452038400, 1452124800,
1452211200, 1452470400, 1452556800, 1452643200, 1452729600, 1452816000,
1453075200, 1453161600, 1453248000, 1453334400, 1453420800, 1453680000,
1453852800, 1453939200, 1454025600, 1454284800, 1454371200, 1454457600,
1454544000, 1454630400, 1454889600, 1454976000, 1455062400, 1451865600,
1451952000, 1452038400, 1452124800, 1452211200, 1452470400, 1452556800,
1452643200, 1452729600, 1452816000, 1453075200, 1453161600, 1453248000,
1453334400, 1453420800, 1453680000, 1453852800, 1453939200, 1454025600,
1454284800, 1454371200, 1454457600, 1454544000, 1454630400, 1454889600,
1454976000, 1455062400), class = c("POSIXct", "POSIXt"), tzone = "UTC"),
AP = c(75451.0611, 70753.7178, 72662.012, 77799.73, 79414.4391,
81469.5286, 81029.1539, 82203.4883, 90183.0465, 91850.0159,
92516.8063, 94350.4702, 91683.3215, 95017.2605, 97184.3196,
97684.4091, 98184.5051, 99017.9898, 100851.6537, 99684.7738,
99518.0794, 100351.5641, 99684.7738, 99518.0794, 100018.1689,
101185.0489, 103852.1975, 81469.5286, 81029.1539, 82203.4883,
90183.0465, 91850.0159, 104852.383, 106019.2565, 100518.2585,
98017.8043, 108686.4052, 81469.5286, 81029.1539, 82203.4883,
90183.0465, 91850.0159, 110686.7762, 111853.6497, 115354.2831,
115854.379, 116687.8638, 104852.383, 106019.2565, 100518.2585,
98017.8043, 81469.5286, 81029.1539, 82203.4883, 75451.0611,
70753.7178, 72662.012, 77799.73, 79414.4391, 81469.5286,
81029.1539, 82203.4883, 90183.0465, 91850.0159, 92516.8063,
94350.4702, 91683.3215, 95017.2605, 97184.3196, 97684.4091,
98184.5051, 99017.9898, 100851.6537, 99684.7738, 99518.0794,
100351.5641, 99684.7738, 99518.0794, 100018.1689, 101185.0489,
103852.1975), BG = c(104852.383, 106019.2565, 100518.2585,
98017.8043, 108686.4052, 114854.1999, 116021.0734, 117354.6541,
113020.536, 114020.7151, 110686.7762, 111853.6497, 115354.2831,
115854.379, 116687.8638, 117021.2526, 115187.5887, 114354.104,
113520.6192, 109853.2914, 109186.5011, 107686.226, 107352.8372,
106852.7413, 116687.8638, 117021.2526, 115187.5887, 75451.0611,
70753.7178, 72662.012, 77799.73, 79414.4391, 81469.5286,
81029.1539, 82203.4883, 90183.0465, 91850.0159, 92516.8063,
94350.4702, 91683.3215, 95017.2605, 97184.3196, 97684.4091,
98184.5051, 99017.9898, 100851.6537, 99684.7738, 99518.0794,
100351.5641, 99684.7738, 99518.0794, 100018.1689, 101185.0489,
103852.1975, 81469.5286, 81029.1539, 82203.4883, 90183.0465,
91850.0159, 104852.383, 106019.2565, 100518.2585, 98017.8043,
108686.4052, 81469.5286, 81029.1539, 82203.4883, 90183.0465,
91850.0159, 110686.7762, 111853.6497, 115354.2831, 115854.379,
116687.8638, 104852.383, 106019.2565, 100518.2585, 98017.8043,
81469.5286, 81029.1539, 82203.4883), CK = c(81469.5286, 81029.1539,
82203.4883, 90183.0465, 91850.0159, 104852.383, 106019.2565,
100518.2585, 98017.8043, 108686.4052, 81469.5286, 81029.1539,
82203.4883, 90183.0465, 91850.0159, 110686.7762, 111853.6497,
115354.2831, 115854.379, 116687.8638, 104852.383, 106019.2565,
100518.2585, 98017.8043, 81469.5286, 81029.1539, 82203.4883,
104852.383, 106019.2565, 100518.2585, 98017.8043, 108686.4052,
114854.1999, 116021.0734, 117354.6541, 113020.536, 114020.7151,
110686.7762, 111853.6497, 115354.2831, 115854.379, 116687.8638,
117021.2526, 115187.5887, 114354.104, 113520.6192, 109853.2914,
109186.5011, 107686.226, 107352.8372, 106852.7413, 116687.8638,
117021.2526, 115187.5887, 75451.0611, 70753.7178, 72662.012,
77799.73, 79414.4391, 81469.5286, 81029.1539, 82203.4883,
90183.0465, 91850.0159, 92516.8063, 94350.4702, 91683.3215,
95017.2605, 97184.3196, 97684.4091, 98184.5051, 99017.9898,
100851.6537, 99684.7738, 99518.0794, 100351.5641, 99684.7738,
99518.0794, 100018.1689, 101185.0489, 103852.1975), Week = c(1,
1, 1, 1, 1, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 4, 4, 4, 4, 4,
5, 5, 5, 5, 5, 6, 6, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 3, 3,
3, 3, 3, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 6, 6, 1, 1, 1, 1,
1, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 4, 4, 4, 4, 4, 5, 5, 5,
5, 5, 6, 6)), .Names = c("Firm", "Date", "AP", "BG", "CK",
"Week"), row.names = c(NA, -81L), class = c("tbl_df", "tbl",
"data.frame"))
I want to make a data frame that looks like this
> dput(SampleFinal)
structure(list(Firm = c("ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG", "ENG",
"ENG", "ENG", "ENG", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS", "AUS",
"AUS", "AUS", "AUS", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ",
"NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ",
"NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ", "NZ"), Date = structure(c(1451865600,
1451952000, 1452038400, 1452124800, 1452211200, 1452470400, 1452556800,
1452643200, 1452729600, 1452816000, 1453075200, 1453161600, 1453248000,
1453334400, 1453420800, 1453680000, 1453852800, 1453939200, 1454025600,
1454284800, 1454371200, 1454457600, 1454544000, 1454630400, 1454889600,
1454976000, 1455062400, 1451865600, 1451952000, 1452038400, 1452124800,
1452211200, 1452470400, 1452556800, 1452643200, 1452729600, 1452816000,
1453075200, 1453161600, 1453248000, 1453334400, 1453420800, 1453680000,
1453852800, 1453939200, 1454025600, 1454284800, 1454371200, 1454457600,
1454544000, 1454630400, 1454889600, 1454976000, 1455062400, 1451865600,
1451952000, 1452038400, 1452124800, 1452211200, 1452470400, 1452556800,
1452643200, 1452729600, 1452816000, 1453075200, 1453161600, 1453248000,
1453334400, 1453420800, 1453680000, 1453852800, 1453939200, 1454025600,
1454284800, 1454371200, 1454457600, 1454544000, 1454630400, 1454889600,
1454976000, 1455062400), class = c("POSIXct", "POSIXt"), tzone = "UTC"),
Week = c("1", "1", "1", "1", "1", "2", "2", "2", "2", "2",
"3", "3", "3", "3", "3", "4", "4", "4", "4", "4", "5", "5",
"5", "5", "5", "NA", "NA", "1", "1", "1", "1", "1", "2",
"2", "2", "2", "2", "3", "3", "3", "3", "3", "4", "4", "4",
"4", "4", "5", "5", "5", "5", "5", "NA", "NA", "1", "1",
"1", "1", "1", "2", "2", "2", "2", "2", "3", "3", "3", "3",
"3", "4", "4", "4", "4", "4", "5", "5", "5", "5", "5", "NA",
"NA"), TotalSales = c("200", "200", "200", "200", "200",
"155", "155", "155", "155", "155", "195", "195", "195", "195",
"195", "150", "150", "150", "150", "150", "155", "155", "155",
"155", "155", "NA", "NA", "140", "140", "140", "140", "140",
"145", "145", "145", "145", "145", "150", "150", "150", "150",
"150", "155", "155", "155", "155", "155", "160", "160", "160",
"160", "160", "NA", "NA", "120", "120", "120", "120", "120",
"125", "125", "125", "125", "125", "130", "130", "130", "130",
"130", "135", "135", "135", "135", "135", "140", "140", "140",
"140", "140", "NA", "NA"), AP = c("75451.061100000006", "70753.717799999999",
"72662.012000000002", "77799.73", "79414.439100000003", "81469.528600000005",
"81029.153900000005", "82203.488299999997", "90183.046499999997",
"91850.015899999999", "92516.806299999997", "94350.470199999996",
"91683.321500000005", "95017.260500000004", "97184.319600000003",
"97684.409100000004", "98184.505099999995", "99017.989799999996",
"100851.6537", "99684.773799999995", "99518.079400000002",
"100351.5641", "99684.773799999995", "99518.079400000002",
"100018.1689", "NA", "NA", "81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"104852.383", "106019.2565", "100518.2585", "98017.804300000003",
"108686.40519999999", "81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"110686.77619999999", "111853.64969999999", "115354.2831",
"115854.379", "116687.86380000001", "104852.383", "106019.2565",
"100518.2585", "98017.804300000003", "81469.528600000005",
"NA", "NA", "75451.061100000006", "70753.717799999999", "72662.012000000002",
"77799.73", "79414.439100000003", "81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"92516.806299999997", "94350.470199999996", "91683.321500000005",
"95017.260500000004", "97184.319600000003", "97684.409100000004",
"98184.505099999995", "99017.989799999996", "100851.6537",
"99684.773799999995", "99518.079400000002", "100351.5641",
"99684.773799999995", "99518.079400000002", "100018.1689",
"NA", "NA"), BG = c("104852.383", "106019.2565", "100518.2585",
"98017.804300000003", "108686.40519999999", "114854.19990000001",
"116021.07339999999", "117354.6541", "113020.53599999999",
"114020.7151", "110686.77619999999", "111853.64969999999",
"115354.2831", "115854.379", "116687.86380000001", "117021.25260000001",
"115187.58869999999", "114354.10400000001", "113520.6192",
"109853.2914", "109186.50109999999", "107686.226", "107352.83719999999",
"106852.74129999999", "116687.86380000001", "NA", "NA", "75451.061100000006",
"70753.717799999999", "72662.012000000002", "77799.73", "79414.439100000003",
"81469.528600000005", "81029.153900000005", "82203.488299999997",
"90183.046499999997", "91850.015899999999", "92516.806299999997",
"94350.470199999996", "91683.321500000005", "95017.260500000004",
"97184.319600000003", "97684.409100000004", "98184.505099999995",
"99017.989799999996", "100851.6537", "99684.773799999995",
"99518.079400000002", "100351.5641", "99684.773799999995",
"99518.079400000002", "100018.1689", "NA", "NA", "81469.528600000005",
"81029.153900000005", "82203.488299999997", "90183.046499999997",
"91850.015899999999", "104852.383", "106019.2565", "100518.2585",
"98017.804300000003", "108686.40519999999", "81469.528600000005",
"81029.153900000005", "82203.488299999997", "90183.046499999997",
"91850.015899999999", "110686.77619999999", "111853.64969999999",
"115354.2831", "115854.379", "116687.86380000001", "104852.383",
"106019.2565", "100518.2585", "98017.804300000003", "81469.528600000005",
"NA", "NA"), CK = c("81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"104852.383", "106019.2565", "100518.2585", "98017.804300000003",
"108686.40519999999", "81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"110686.77619999999", "111853.64969999999", "115354.2831",
"115854.379", "116687.86380000001", "104852.383", "106019.2565",
"100518.2585", "98017.804300000003", "81469.528600000005",
"NA", "NA", "104852.383", "106019.2565", "100518.2585", "98017.804300000003",
"108686.40519999999", "114854.19990000001", "116021.07339999999",
"117354.6541", "113020.53599999999", "114020.7151", "110686.77619999999",
"111853.64969999999", "115354.2831", "115854.379", "116687.86380000001",
"117021.25260000001", "115187.58869999999", "114354.10400000001",
"113520.6192", "109853.2914", "109186.50109999999", "107686.226",
"107352.83719999999", "106852.74129999999", "116687.86380000001",
"NA", "NA", "75451.061100000006", "70753.717799999999", "72662.012000000002",
"77799.73", "79414.439100000003", "81469.528600000005", "81029.153900000005",
"82203.488299999997", "90183.046499999997", "91850.015899999999",
"92516.806299999997", "94350.470199999996", "91683.321500000005",
"95017.260500000004", "97184.319600000003", "97684.409100000004",
"98184.505099999995", "99017.989799999996", "100851.6537",
"99684.773799999995", "99518.079400000002", "100351.5641",
"99684.773799999995", "99518.079400000002", "100018.1689",
"NA", "NA")), class = c("tbl_df", "tbl", "data.frame"), row.names = c(NA,
-81L), .Names = c("Firm", "Date", "Week", "TotalSales", "AP",
"BG", "CK"))
It has the sales value for every week repeated for 5 date values for each firm. New data frame should have all other columns in Sample2.
Also suggest how to make a data frame when every fifth date value of data frame(Sample2) is matched with weekly sales value from data frame(Sample3). The data frames are large so I have given the required links. Please suggest solutions without Data.table package. Thank you very much.
Kindly do not ignore the panel setting of the question before commenting.