2016-10-23 22 views
0

目前我正嘗試根據下面的數據集建立堆疊條形圖:R 中的堆疊條形圖(ggplot)::試圖在圖表中創建多個條形

Dataset Example

數據說明: 每個奇數列表示公司變量,每個偶數列表示該公司的產量。 每兩列(公司和產量)代表某一小時的生產情況。

這是我的數據:

structure(list(Hour = c(NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, 
NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA), X1 = structure(c(4L, 
5L, 5L, 5L, 5L, 2L, 3L, 5L, 5L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 
1L, 1L, 1L, 1L, 1L), .Label = c("", "B", "C", "Company", "D"), class = "factor"), 
    X1.1 = structure(c(10L, 5L, 7L, 9L, 2L, 4L, 8L, 3L, 6L, 1L, 
    1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
    "30", "31", "49", "5", "63", "73", "83", "86", "Production" 
    ), class = "factor"), X2 = structure(c(4L, 5L, 2L, 5L, 5L, 
    2L, 5L, 5L, 2L, 3L, 2L, 2L, 3L, 5L, 1L, 1L, 1L, 1L, 1L, 1L, 
    1L, 1L), .Label = c("", "A", "B", "Company", "D"), class = "factor"), 
    X2.1 = structure(c(15L, 10L, 12L, 6L, 11L, 13L, 3L, 14L, 
    5L, 4L, 2L, 9L, 8L, 7L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
    "15", "32", "34", "36", "5", "50", "52", "58", "71", "73", 
    "74", "78", "98", "Production"), class = "factor"), X3 = structure(c(5L, 
    2L, 2L, 6L, 6L, 6L, 6L, 6L, 6L, 6L, 6L, 4L, 6L, 4L, 3L, 3L, 
    1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", "A", "B", "C", "Company", 
    "D"), class = "factor"), X3.1 = structure(c(17L, 6L, 15L, 
    3L, 4L, 16L, 13L, 7L, 11L, 9L, 5L, 8L, 10L, 14L, 12L, 2L, 
    1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", "1", "11", "14", 
    "19", "33", "42", "43", "50", "57", "68", "81", "82", "84", 
    "85", "95", "Production"), class = "factor"), X4 = structure(c(4L, 
    5L, 1L, 1L, 5L, 5L, 5L, 5L, 1L, 1L, 5L, 5L, 3L, 3L, 3L, 5L, 
    2L, 2L, 5L, 2L, 5L, 5L), .Label = c("A", "B", "C", "Company", 
    "D"), class = "factor"), X4.1 = structure(c(21L, 1L, 18L, 
    12L, 20L, 10L, 5L, 6L, 4L, 11L, 16L, 9L, 3L, 7L, 13L, 19L, 
    8L, 17L, 4L, 2L, 15L, 14L), .Label = c("100", "2", "24", 
    "28", "3", "38", "4", "40", "42", "43", "47", "48", "54", 
    "64", "69", "7", "71", "81", "9", "97", "Production"), class = "factor"), 
    X5 = structure(c(5L, 6L, 6L, 3L, 6L, 6L, 6L, 6L, 2L, 2L, 
    6L, 6L, 6L, 3L, 6L, 3L, 6L, 3L, 4L, 1L, 1L, 1L), .Label = c("", 
    "A", "B", "C", "Company", "D"), class = "factor"), X5.1 = structure(c(18L, 
    12L, 3L, 9L, 14L, 10L, 16L, 2L, 17L, 13L, 5L, 13L, 4L, 7L, 
    6L, 2L, 15L, 11L, 8L, 1L, 1L, 1L), .Label = c("", "0", "1", 
    "12", "25", "30", "34", "38", "39", "45", "46", "58", "60", 
    "68", "73", "78", "97", "Production"), class = "factor"), 
    X6 = structure(c(5L, 3L, 4L, 3L, 6L, 6L, 3L, 3L, 2L, 3L, 
    6L, 3L, 6L, 3L, 2L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
    "A", "B", "C", "Company", "D"), class = "factor"), X6.1 = structure(c(16L, 
    9L, 4L, 5L, 8L, 11L, 15L, 6L, 10L, 7L, 14L, 3L, 12L, 2L, 
    13L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", "1", "29", 
    "3", "34", "4", "42", "48", "65", "68", "70", "8", "92", 
    "95", "96", "Production"), class = "factor")), .Names = c("Hour", 
"X1", "X1.1", "X2", "X2.1", "X3", "X3.1", "X4", "X4.1", "X5", 
"X5.1", "X6", "X6.1"), class = "data.frame", row.names = c(NA, 
-22L)) 

我可以使用下面的代碼爲第一個小時創建圖表:

# Plot a single stacked bar for the first hour (the version the asker reports
# as working).
# NOTE(review): read_excel() is presumably readxl::read_excel; the file name
# ends in .csv -- confirm the file really is an Excel workbook.
dataset <- read_excel("Example.csv") 
# Constant x value, so every row lands in the same bar.
hour = 1 
# Second column of `dataset` supplies the bar heights ...
Production <- dataset[, 2] 
# ... and the first column supplies the fill grouping.
Company <- dataset[, 1] 
# The aesthetics below reference the `hour`, `Production` and `Company`
# objects defined above; stat = "identity" uses the y values as given.
ggplot(data = dataset, aes(x = hour, y = Production, fill = Company)) + 
    geom_bar(stat = "identity") 

柱形圖如下圖所示:

​​

現在問題:

我寫了一段代碼來創建包含「公司」變量和「生產」變量的數據集。但是,當我運行這段代碼時,出現了這樣的錯誤:

Aesthetics must be either length 1 or the same as the data (21): x, y, fill 

我想知道我犯了什麼技術錯誤,以及該如何解決這個問題。 這是我的代碼:

# Attempt to prepare two hours at once. This is the code the asker reports
# leads to the "Aesthetics must be either length 1 or the same as the data"
# error.
# 1 x 2 matrix holding the hour values 1 and 2.
hour <- matrix(0, 1, 2) 
hour[1, 1] = 1 
hour[1, 2] = 2 
# 22 x 2 matrix; column i is filled from column 2 * i of `dataset`
# (i.e. columns 2 and 4).
Production <- matrix(0, 22, 2) 
for (i in 1:2) { 
    Production[1:22, i] <- dataset[1:22, (2 * i)] 
} 
# 22 x 2 matrix; column i is filled from column 2 * i - 1 of `dataset`
# (i.e. columns 1 and 3).
Company <- matrix(0, 22, 2) 
for (i in 1:2) { 
    Company[1:22, i] <- dataset[1:22, (2 * i) - 1] 
} 
# NOTE(review): per the comments below, ggplot2 expects one data.frame with a
# column per aesthetic rather than separate matrices like these.

任何幫助將不勝感激。

+1

請以可用的格式提供該數據集,而不是圖像,例如使用'dput(dataset)'。 – Deleet

+0

嘿Deleet,我剛發佈它。這有幫助嗎? –

+1

ggplot不喜歡矩陣;只接受data.frame。您需要整理您的數據,使每個美學(aesthetic)都對應data.frame中的單個變量。現在您的數據並不是這樣,而且您實際擁有的數據是什麼也還不清楚。 – alistaire

回答

0

就我對問題的理解,您是想創建一個條形圖,顯示每個小時各公司的產量,每個條形代表不同的小時。

首先ggplot2與data.frames一起使用,其中每個變量都是不同的列,所以您的第一步應該是將您的數據轉換爲this format。有幾種方法可以做到這一點。

有了這種格式的數據(下面記爲 df2),就很容易得到你所需要的:

# Stacked bars: one bar per Hour, segment heights taken directly from
# Production (stat = "identity"), segments coloured by Company.
ggplot(df2) +
  geom_bar(
    mapping = aes(x = Hour, y = Production, fill = Company),
    stat = "identity"
  )

enter image description here

此外,你可能想消除堆疊條形中重複的顏色,這樣更容易看出每個公司的生產總量。爲此,您需要使用weight美學而不是identity統計,就像這樣:

# Same chart using the default count stat weighted by Production, so rows of
# the same Company within an Hour are summed into a single coloured segment.
ggplot(df2, aes(Hour, weight = Production, fill = Company)) +
  geom_bar()

enter image description here

希望這有助於!

+0

你完全是我的男人!我也意識到了這一點。非常感謝!不能相信我花了這麼長時間才找出解決方法 –

0

目前尚不清楚你想要做什麼。例如。 data.frame中的變量沒有正確命名,並且Hour甚至不在data.frame中。

ggplot2要求所有變量都在您提供的data.frame中(即代碼中的dataset)。您正在數據框之外創建具有合理名稱的新對象,而您應該做的是重命名數據框中的變量。小時變量的長度爲1,所以目前還不清楚你想用它做什麼。

這是我根據你的代碼能想出的最佳方案:

#load data 
dataset = structure(list(X1 = structure(c(4L, 4L, 4L, 4L, 2L, 3L, 4L, 4L, 
1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
"B", "C", "D"), class = "factor"), X1.1 = c(5L, 73L, 86L, 30L, 
49L, 83L, 31L, 63L, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, NA, 
NA, NA), X2 = structure(c(4L, 2L, 4L, 4L, 2L, 4L, 4L, 2L, 3L, 
2L, 2L, 3L, 4L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
"A", "B", "D"), class = "factor"), X2.1 = c(71L, 74L, 5L, 73L, 
78L, 32L, 98L, 36L, 34L, 15L, 58L, 52L, 50L, NA, NA, NA, NA, 
NA, NA, NA, NA), X3 = structure(c(2L, 2L, 5L, 5L, 5L, 5L, 5L, 
5L, 5L, 5L, 4L, 5L, 4L, 3L, 3L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
"A", "B", "C", "D"), class = "factor"), X3.1 = c(33L, 85L, 11L, 
14L, 95L, 82L, 42L, 68L, 50L, 19L, 43L, 57L, 84L, 81L, 1L, NA, 
NA, NA, NA, NA, NA), X4 = structure(c(4L, 1L, 1L, 4L, 4L, 4L, 
4L, 1L, 1L, 4L, 4L, 3L, 3L, 3L, 4L, 2L, 2L, 4L, 2L, 4L, 4L), .Label = c("A", 
"B", "C", "D"), class = "factor"), X4.1 = c(100L, 81L, 48L, 97L, 
43L, 3L, 38L, 28L, 47L, 7L, 42L, 24L, 4L, 54L, 9L, 40L, 71L, 
28L, 2L, 69L, 64L), X5 = structure(c(5L, 5L, 3L, 5L, 5L, 5L, 
5L, 2L, 2L, 5L, 5L, 5L, 3L, 5L, 3L, 5L, 3L, 4L, 1L, 1L, 1L), .Label = c("", 
"A", "B", "C", "D"), class = "factor"), X5.1 = c(58L, 1L, 39L, 
68L, 45L, 78L, 0L, 97L, 60L, 25L, 60L, 12L, 34L, 30L, 0L, 73L, 
46L, 38L, NA, NA, NA), X6 = structure(c(3L, 4L, 3L, 5L, 5L, 3L, 
3L, 2L, 3L, 5L, 3L, 5L, 3L, 2L, 1L, 1L, 1L, 1L, 1L, 1L, 1L), .Label = c("", 
"A", "B", "C", "D"), class = "factor"), X6.1 = c(65L, 3L, 34L, 
48L, 70L, 96L, 4L, 68L, 42L, 95L, 29L, 8L, 1L, 92L, NA, NA, NA, 
NA, NA, NA, NA)), .Names = c("X1", "X1.1", "X2", "X2.1", "X3", 
"X3.1", "X4", "X4.1", "X5", "X5.1", "X6", "X6.1"), class = "data.frame", row.names = c(NA, 
-21L)) 

# Give the first two columns the names the plot refers to, and add a constant
# Hour column so every row stacks into the same bar.
names(dataset)[c(1L, 2L)] <- c("Company", "Production")
dataset$Hour <- 1

# Draw the stacked bar for hour 1, coloured by company.
library(ggplot2)
ggplot(data = dataset) +
  geom_bar(
    mapping = aes(x = Hour, y = Production, fill = Company),
    stat = "identity"
  )

輸出是: enter image description here

建議先閱讀 a textbook on R 和 the ggplot2 textbook

+0

Deleet,感謝您的幫助。您在我的帖子中引用了您製作的輸出內容。但是,該輸出僅適用於數據的前兩列。如何在右側創建另一個使用後兩列數據的條形? 我也重新格式化了我的數據,並將其替換爲我編輯的帖子。謝謝 –