# 把博客文章里的内容都搬到随笔这里来啦~ 用R读取各类文件其实很简单,只是有时候要注意一下加载library的顺序。不过没关系,出错时R一般都会给出提示!
# ---------------------------------
# Read a comma-separated text file into a data frame.
# - header = FALSE: the first line is data, so columns get default names.
# - na.strings = "null": the literal text "null" is read as NA.
# - encoding: read.table() only recognises "UTF-8" and "latin1" here; the
#   spelling "utf8" is not one of them, so it is written as "UTF-8".
bank1 <- read.table(
  "user_info.txt",
  header = FALSE,
  sep = ",",
  na.strings = "null",
  encoding = "UTF-8"
)
head(bank1)
# Read a CSV file into a data frame.
# - header = FALSE: the first line is data, so columns get default names.
# - na.strings = "null": the literal text "null" is read as NA.
# - encoding: only "UTF-8" and "latin1" are recognised values; the spelling
#   "utf8" is not one of them, so it is written as "UTF-8".
bank2 <- read.csv(
  "SegData.csv",
  header = FALSE,
  sep = ",",
  na.strings = "null",
  encoding = "UTF-8"
)
head(bank2)
# Read a sheet from an Excel workbook with the xlsx package.
# Install xlsx only when it is missing, rather than reinstalling it every
# time the script runs.
if (!requireNamespace("xlsx", quietly = TRUE)) {
  install.packages("xlsx")
}
library(xlsxjars)
library(rJava)
library(xlsx)
# Read the sheet named "SegData2"; header = FALSE treats the first row as data.
bank3 <- read.xlsx(
  "SegData.xlsx",
  sheetName = "SegData2",
  header = FALSE
)
head(bank3)
# Read an XML file with the XML package.
# Install packages only when they are missing. "methods" ships with R as a
# base package, so it is not installed from CRAN.
# NOTE(review): RMySQL is not used in this section; its install is kept from
# the original script in case later code depends on it - confirm.
for (pkg in c("XML", "RMySQL")) {
  if (!requireNamespace(pkg, quietly = TRUE)) {
    install.packages(pkg)
  }
}
library(XML)
library(methods)
# Parse the document into an R-level tree and peek at the result.
bank4 <- xmlTreeParse(file = "input.xml")
head(bank4)
# Convert the same file directly to a data frame (printed, not stored).
xmlToDataFrame("input.xml")
# Read a JSON file with the rjson package.
# Package names are case-sensitive: the package is "rjson", not "rJson".
# Install it only when it is missing.
if (!requireNamespace("rjson", quietly = TRUE)) {
  install.packages("rjson")
}
library(rjson)
# fromJSON() returns the parsed document as R lists/vectors.
bank5 <- fromJSON(file = "input.json")
head(bank5)
# Convert the parsed result to a data frame for tabular inspection.
json_data_frame <- as.data.frame(bank5)
head(json_data_frame)
# From SegData, extract the users who own a house and whose income is at
# least 50,000 and below 100,000.
library(xlsxjars)
library(rJava)
library(xlsx)
# Read the first sheet of the workbook.
mydata <- read.xlsx("SegData.xlsx", 1)
head(mydata)
# which() keeps only rows where the condition is TRUE. Indexing with the raw
# logical vector would add all-NA rows wherever house or income is missing.
mydata[
  which(
    mydata$house == "Yes" &
      mydata$income >= 50000 &
      mydata$income < 100000
  ),
]