資源簡介
Python數據挖掘入門與實踐.zip (code)
代碼片段和文件信息
import os
import re

from mrjob.job import MRJob
from mrjob.step import MRStep
# Matches runs of word characters and apostrophes, so contractions such as
# "don't" stay together as a single token.
word_search_re = re.compile(r"[\w']+")
class ExtractPosts(MRJob):
    """mrjob job that extracts individual posts from blog files.

    The mapper reads its input line by line, collects the lines found
    between an opening and a closing post marker, and emits one
    ``(gender, repr(post_text))`` pair per closed post. Only input files
    whose base name starts with ``"51"`` are processed.
    """

    # True while the mapper is between an opening and a closing post marker.
    post_start = False
    # Lines of the post currently being collected. This class-level default
    # is never mutated in place: the mapper rebinds ``self.post`` to a fresh
    # list whenever a post starts or ends.
    post = []

    def mapper(self, key, line):
        """Collect post lines and yield each completed post.

        Args:
            key: Unused; supplied by mrjob.
            line: One line of text from the current input file.

        Yields:
            ``(gender, text)`` where ``gender`` is the second dot-separated
            field of the input file's base name and ``text`` is ``repr`` of
            the post's stripped lines joined with newlines.

        Raises:
            KeyError: If the ``map_input_file`` environment variable is
                not set.
            IndexError: If a processed file's name contains no ``.``.
        """
        # Use the base name so a directory prefix (or dots in directory
        # names) cannot break the prefix test or the gender field lookup.
        filename = os.path.basename(os.environ["map_input_file"])
        if not filename.startswith("51"):
            return

        # Remove leading and trailing whitespace.
        line = line.strip()

        # NOTE(review): the scraped snippet had "" and " " here, which can
        # never close a post after strip(); the tag text looks like it was
        # eaten by HTML extraction. "<post>"/"</post>" is assumed from the
        # blog corpus format -- confirm against the input files.
        if line == "<post>":
            self.post_start = True
            self.post = []
        elif line == "</post>":
            self.post_start = False
            gender = filename.split(".")[1]
            yield gender, repr("\n".join(self.post))
            self.post = []
        elif self.post_start:
            self.post.append(line)
if __name__ == '__main__':
    # Script entry point: hand control to the job's own run() classmethod.
    ExtractPosts.run()
 屬性            大小     日期    時間   名稱
----------- ---------  ---------- -----  ----
     目錄           0  2018-03-06 19:04  #Python數據挖掘入門與實踐\
     目錄           0  2018-03-09 17:16  #Python數據挖掘入門與實踐\Code_REWRITE\
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\.ipynb_checkpoints\
     文件      434745  2015-06-28 15:31  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\.ipynb_checkpoints\Chapter 10 (Cluster Types)-checkpoint.ipynb
     文件       64766  2015-06-28 15:36  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\.ipynb_checkpoints\Chapter 10 Clusterer-checkpoint.ipynb
     文件     1100672  2015-06-28 15:34  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\.ipynb_checkpoints\Chapter 10 Image creation 10_02.png-checkpoint.ipynb
     文件          72  2015-06-28 15:29  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\.ipynb_checkpoints\Chapter 10-checkpoint.ipynb
     文件       78925  2015-06-28 15:40  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 10\Chapter 10 Clusterer.ipynb
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 11\
     文件       58837  2015-06-28 15:17  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 11\Chapter 11 (CIFAR).ipynb
     文件       62409  2015-06-28 15:02  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 11\Chapter 11 (Theano and Lasagne).ipynb
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\
     文件       38759  2015-06-28 15:22  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\CH12 MapReduce Basics.ipynb
     文件       10578  2015-05-08 19:56  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\Chapter 12 (NB Predict).ipynb
     文件        1730  2015-05-08 06:35  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\Chapter 12 (Test load).ipynb
     文件         882  2015-05-08 16:49  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\extract_posts.py
     文件        1986  2015-05-08 09:37  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\nb_predict.py
     文件        2021  2015-05-08 08:44  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 12\nb_train.py
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\.ipynb_checkpoints\
     文件       14242  2015-05-28 09:33  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\.ipynb_checkpoints\ch1_affinity-checkpoint.ipynb
     文件       13797  2015-05-28 09:33  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\.ipynb_checkpoints\ch1_oner_application-checkpoint.ipynb
     文件        1000  2014-10-10 03:13  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\affinity_dataset.txt
     文件       14242  2015-05-28 09:33  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\ch1_affinity.ipynb
     文件        3544  2014-10-10 03:13  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\ch1_affinity_create.ipynb
     文件       14210  2017-10-11 06:29  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 1\ch1_oner_application.ipynb
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 2\
     目錄           0  2017-10-11 14:15  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 2\.ipynb_checkpoints\
     文件      128669  2015-05-28 10:08  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 2\.ipynb_checkpoints\Ionosphere Nearest Neighbour-checkpoint.ipynb
     文件      129473  2017-10-11 13:23  #Python數據挖掘入門與實踐\Code_REWRITE\Chapter 2\Ionosphere Nearest Neighbour.ipynb
............此處省略40個文件信息
評論
共有 條評論