文本收集
# Working directory
# Only one of the two example paths can exist on a given machine, so choose
# the one matching the current platform instead of calling setwd() on both
# (the call with the other platform's path would always fail).
if (.Platform$OS.type == "windows") {
  # windows example
  setwd("C:\\Users\\shukai\\Documents\\corpus")
} else {
  # linux/MacOS example
  setwd("~/Dropbox/Linguistic.Analysis.and.Data.Science/corpus")
}
# get listing of .txt files in directory
# `pattern` is a regular expression, not a shell glob: an unanchored "*.txt"
# also matches names such as "notes.txt.bak", so anchor on the literal
# ".txt" extension at the end of the name.
filenames <- list.files(getwd(), pattern = "\\.txt$")
# read the files into a list holding one character vector of lines per file
files <- lapply(filenames, readLines)
網頁成份擷取
Last updated