Scala 并行集合:为工作线程使用线程局部变量的惯用方法



下面代码中的 `progress` 函数是我的工作函数。我需要让它能够访问一些创建或获取成本很高的类的实例。标准库中是否有用于线程局部变量的现成机制?还是说我必须自己编写一个对象池管理器?

/**
 * Entry point: walks every topic returned by `ProcessingQueries.getAllTopics`
 * in parallel and prints a running completion percentage to the console.
 *
 * An explicit `main` is used instead of the `App` trait. `App` has
 * initialization-order pitfalls, and running a parallel `foreach` from code
 * that executes as part of object initialization can leave worker threads
 * blocked waiting for that initialization to finish. Here all fields are
 * fully initialized before `main` starts the parallel traversal.
 */
object Start {
    /** Shared instance built once when the object is initialized. */
    val lexicon = new Global()

    // Identifier handed to processTopic as the forum id, plus the topic ids to visit.
    val (fid, tl) = ProcessingQueries.getAllTopics("hon")

    /** Number of work items; used as the denominator of the progress percentage. */
    val totalPosts = tl.size

    /** Count of completed work items, shared by all worker threads. */
    val counter = new AtomicInteger(0)

    /** Parallel view of the topic list that `main` iterates over. */
    val par = tl.par

    /**
     * Records one completed work item and, on every 100th item, redraws the
     * completion percentage on the current console line.
     *
     * Kept parameterless (no `()`) so existing call sites keep compiling.
     */
    def progress: Unit = {
        val current = counter.getAndIncrement()
        if (current % 100 == 0) {
            val perc = current.toFloat * 100 / totalPosts
            // "\r" returns the cursor to the start of the line so each update
            // overwrites the previous one instead of appending to it.
            print(f"\r$perc%4.2f%%")
        }
    }

    /**
     * Loads one topic together with its posts and reports progress.
     *
     * @param forumId identifier of the forum the topic belongs to
     * @param topicId identifier of the topic to load
     */
    def processTopic(forumId: Int, topicId: Int): Unit = {
        // The loaded values are not used yet in this snippet; the per-topic
        // work would operate on them here.
        val (topic, posts) = ProcessingQueries.getTopicAndPosts(forumId, topicId)
        progress
    }

    /** Processes all topics on the parallel collection's worker threads. */
    def main(args: Array[String]): Unit = {
        par.foreach { topic_id =>
            processTopic(fid, topic_id)
        }
    }
}

(已替换之前的答案。)下面这种写法简洁利落,正好解决了这个问题:

/**
 * Thread-local holder for a `StanfordCoreNLP` instance.
 *
 * Each thread that calls `MyAnnotator.get` receives its own instance, built
 * on that thread's first access from the shared `props` configuration.
 */
object MyAnnotator extends ThreadLocal[StanfordCoreNLP] {
    /** Configuration passed to every `StanfordCoreNLP` instance this object creates. */
    val props = new Properties()

    // Populate the configuration from a single key/value table.
    Seq(
        "annotators" -> "tokenize,ssplit,pos,lemma,parse",
        "ssplit.newlineIsSentenceBreak" -> "two",
        "parse.maxlen" -> "40"
    ).foreach { case (key, value) => props.setProperty(key, value) }

    /** Builds the instance for the calling thread from `props`. */
    override def initialValue: StanfordCoreNLP = {
        val annotator = new StanfordCoreNLP(props)
        annotator
    }
}

相关内容

  • 没有找到相关文章

最新更新