2017-10-21 56 views
0
import net.ruippeixotog.scalascraper.browser.JsoupBrowser 
import net.ruippeixotog.scalascraper.dsl.DSL._ 
import net.ruippeixotog.scalascraper.dsl.DSL.Extract._ 
import net.ruippeixotog.scalascraper.dsl.DSL.Parse._ 

/** Small scala-scraper example: fetches a page and prints one element selected from it. */
object Scraper {
    // JsoupBrowser instance used to download and parse the page.
    val browser = JsoupBrowser()

    // The page is requested as part of this object's initialisation.
    val doc = browser.get("http://camhr.com")

    /** Prints the result of the optional extraction of the element matching `#footer`. */
    def main(args: Array[String]): Unit =
        print(doc >?> element("#footer"))
}

我在浏览器中打开该网站时看到的是英文,但运行这段代码后,控制台(IntelliJ IDE)中输出的却是中文。(问题标题:错误的输出编码渲染与 scalascraper)

如何才能让程序获取并输出正确的英文文本?

回答

1

可以尝试类似下面的写法,在请求中加入 Accept-Language 头,明确要求返回英文内容:

// Address of the page to download.
val url = "http://camhr.com"

// Prepare the jsoup connection, asking for English via the Accept-Language
// request header, and only then execute the GET request.
val connection = Jsoup.connect(url).header("Accept-Language", "en")
val doc = connection.get()