com.beachape.metascraper

ScraperActor

class ScraperActor extends Actor with Logging

Actor for scraping metadata from websites at URLs

Should be instantiated with the Props provided via the companion object's factory method

Linear Supertypes
Logging, Actor, AnyRef, Any
Ordering
  1. Alphabetic
  2. By inheritance
Inherited
  1. ScraperActor
  2. Logging
  3. Actor
  4. AnyRef
  5. Any
  1. Hide All
  2. Show all
Learn more about member selection
Visibility
  1. Public
  2. All

Instance Constructors

  1. new ScraperActor()

Type Members

  1. type Receive = PartialFunction[Any, Unit]

    Definition Classes
    Actor

Value Members

  1. final def !=(arg0: AnyRef): Boolean

    Definition Classes
    AnyRef
  2. final def !=(arg0: Any): Boolean

    Definition Classes
    Any
  3. final def ##(): Int

    Definition Classes
    AnyRef → Any
  4. final def ==(arg0: AnyRef): Boolean

    Definition Classes
    AnyRef
  5. final def ==(arg0: Any): Boolean

    Definition Classes
    Any
  6. final def asInstanceOf[T0]: T0

    Definition Classes
    Any
  7. def clone(): AnyRef

    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  8. implicit val context: ActorContext

    Definition Classes
    Actor
  9. final def eq(arg0: AnyRef): Boolean

    Definition Classes
    AnyRef
  10. def equals(arg0: Any): Boolean

    Definition Classes
    AnyRef → Any
  11. def extractDescription(doc: Document): String

    Returns the description of a Jsoup document

    Returns the description of a Jsoup document

    Prioritises <meta property="og:description" .. > tag over <meta name="description" .. > tag

    doc

    Document as parsed by JSoup

    returns

    String description

  12. def extractImages(doc: Document, takeFirst: Int = 5): Seq[String]

    Returns a best guess for the best images of a Jsoup document

    Returns a best guess for the best images of a Jsoup document

    * Prioritises <meta property="og:image" .. > tags over <img> tags

    doc

    Document as parsed by Jsoup

    takeFirst

    Number of elements to take, defaults to 5

    returns

    Seq[String] collection of image urls

  13. def extractMainImage(doc: Document): String

    Returns a best guess for the url of the main Image of a Jsoup document

    Returns a best guess for the url of the main Image of a Jsoup document

    Prioritises the first <meta property="og:image" .. > tag over the first <img> tag

    doc

    Document as parsed by JSoup

    returns

    String url of the main image

  14. def extractScrapedData(doc: Document, accessedUrl: String): ScrapedData

    Returns a ScrapedData object filled out using data extracted from a JSoup document

    Returns a ScrapedData object filled out using data extracted from a JSoup document

    Prioritises Open Graph tags (see https://developers.facebook.com/docs/opengraph/) over conventional tags like <title>

    doc

    Document as parsed by JSoup

    accessedUrl

    String url that was used to access the document

    returns

    ScrapedData

  15. def extractTitle(doc: Document): String

    Returns the title of a Jsoup document

    Returns the title of a Jsoup document

    Prioritises <meta property="og:title" .. > tag over <title> tag

    doc

    Document as parsed by JSoup

    returns

    String title

  16. def extractUrl(doc: Document, accessedUrl: String): String

    Returns the url of a Jsoup document

    Returns the url of a Jsoup document

    Prioritises <meta property="og:url" .. > tag over the url used to access this document

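    doc

    Document as parsed by JSoup

    accessedUrl

    String url used to access this document; used when no <meta property="og:url" .. > tag is present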

    returns

    String url

  17. def finalize(): Unit

    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  18. final def getClass(): Class[_]

    Definition Classes
    AnyRef → Any
  19. def hashCode(): Int

    Definition Classes
    AnyRef → Any
  20. final def isInstanceOf[T0]: Boolean

    Definition Classes
    Any
  21. lazy val logger: Logger

    Attributes
    protected
    Definition Classes
    Logging
  22. final def ne(arg0: AnyRef): Boolean

    Definition Classes
    AnyRef
  23. final def notify(): Unit

    Definition Classes
    AnyRef
  24. final def notifyAll(): Unit

    Definition Classes
    AnyRef
  25. def postRestart(reason: Throwable): Unit

    Definition Classes
    Actor
    Annotations
    @throws( classOf[java.lang.Exception] )
  26. def postStop(): Unit

    Definition Classes
    Actor
    Annotations
    @throws( classOf[java.lang.Exception] )
  27. def preRestart(reason: Throwable, message: Option[Any]): Unit

    Definition Classes
    Actor
    Annotations
    @throws( classOf[java.lang.Exception] )
  28. def preStart(): Unit

    Definition Classes
    Actor
    Annotations
    @throws( classOf[java.lang.Exception] )
  29. def receive: PartialFunction[Any, Unit]

    Definition Classes
    ScraperActor → Actor
  30. implicit final val self: ActorRef

    Definition Classes
    Actor
  31. final def sender: ActorRef

    Definition Classes
    Actor
  32. def supervisorStrategy: SupervisorStrategy

    Definition Classes
    Actor
  33. final def synchronized[T0](arg0: ⇒ T0): T0

    Definition Classes
    AnyRef
  34. def toString(): String

    Definition Classes
    AnyRef → Any
  35. def unhandled(message: Any): Unit

    Definition Classes
    Actor
  36. final def wait(): Unit

    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  37. final def wait(arg0: Long, arg1: Int): Unit

    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  38. final def wait(arg0: Long): Unit

    Definition Classes
    AnyRef
    Annotations
    @throws( ... )

Inherited from Logging

Inherited from Actor

Inherited from AnyRef

Inherited from Any

Ungrouped