Browsers¶

`PageSourceGetter` ¶

Bases: ABC

All browsers must inherit from this class

Source code in extract_emails/browsers/page_source_getter.py

class PageSourceGetter(ABC):
    """Abstract base that every browser implementation must inherit from.

    Subclasses provide the lifecycle hooks (``start``/``stop`` and their
    async counterparts) plus the page fetchers. This base class only wires
    those hooks into the sync and async context-manager protocols.
    """

    # ------------------------------------------------------------------
    # Hooks every subclass has to implement
    # ------------------------------------------------------------------

    @abstractmethod
    def start(self) -> None:
        """Hook called by ``__enter__`` when a ``with`` block is entered."""

    @abstractmethod
    def stop(self) -> None:
        """Hook called by ``__exit__`` when a ``with`` block is left."""

    @abstractmethod
    async def astart(self) -> None:
        """Hook awaited by ``__aenter__`` on entering ``async with``."""

    @abstractmethod
    async def astop(self) -> None:
        """Hook awaited by ``__aexit__`` on leaving ``async with``."""

    @abstractmethod
    def get_page_source(self, url: str) -> str:
        """Fetch whatever content is served at ``url``.

        Args:
            url: Address of the page to load.

        Returns:
            The page content (html, json, whatever).
        """

    @abstractmethod
    async def aget_page_source(self, url: str) -> str:
        """Fetch whatever content is served at ``url``, asynchronously.

        Args:
            url: Address of the page to load.

        Returns:
            The page content (html, json, whatever).
        """

    # ------------------------------------------------------------------
    # Context-manager plumbing built on top of the hooks
    # ------------------------------------------------------------------

    def __enter__(self) -> PageSourceGetter:
        """Call ``start()`` and hand the instance to the ``with`` block.

        Returns:
            This very instance, so it can be bound with ``as``.
        """
        self.start()
        return self

    def __exit__(self, exc_type, exc_val, exc_tb) -> None:
        """Call ``stop()`` when the ``with`` block finishes.

        The exception details are accepted but not inspected; because the
        method returns ``None``, an in-flight exception keeps propagating.

        Args:
            exc_type: Exception type
            exc_val: Exception value
            exc_tb: Exception traceback
        """
        self.stop()

    async def __aenter__(self) -> PageSourceGetter:
        """Await ``astart()`` and hand the instance to ``async with``.

        Returns:
            This very instance, so it can be bound with ``as``.
        """
        await self.astart()
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb) -> None:
        """Await ``astop()`` when the ``async with`` block finishes.

        The exception details are accepted but not inspected; because the
        method returns ``None``, an in-flight exception keeps propagating.

        Args:
            exc_type: Exception type
            exc_val: Exception value
            exc_tb: Exception traceback
        """
        await self.astop()

`__aenter__()` `async` ¶

Async context manager enter method.

Returns:

Type	Description
`PageSourceGetter`	Self instance for method chaining

Source code in extract_emails/browsers/page_source_getter.py

async def __aenter__(self) -> PageSourceGetter:
    """Await ``astart()`` and hand the instance to ``async with``.

    Returns:
        This very instance, so it can be bound with ``as``.
    """
    await self.astart()
    return self

`__aexit__(exc_type, exc_val, exc_tb)` `async` ¶

Async context manager exit method.

Parameters:

Name	Description	Default
`exc_type`	Exception type	required
`exc_val`	Exception value	required
`exc_tb`	Exception traceback	required

Source code in extract_emails/browsers/page_source_getter.py

async def __aexit__(self, exc_type, exc_val, exc_tb) -> None:
    """Await ``astop()`` when the ``async with`` block finishes.

    The exception details are accepted but not inspected; because the
    coroutine returns ``None``, an in-flight exception keeps propagating.

    Args:
        exc_type: Exception type
        exc_val: Exception value
        exc_tb: Exception traceback
    """
    await self.astop()

`__enter__()` ¶

Context manager enter method.

Returns:

Type	Description
`PageSourceGetter`	Self instance for method chaining

Source code in extract_emails/browsers/page_source_getter.py

def __enter__(self) -> PageSourceGetter:
    """Call ``start()`` and hand the instance to the ``with`` block.

    Returns:
        This very instance, so it can be bound with ``as``.
    """
    self.start()
    return self

`__exit__(exc_type, exc_val, exc_tb)` ¶

Context manager exit method.

Parameters:

Name	Description	Default
`exc_type`	Exception type	required
`exc_val`	Exception value	required
`exc_tb`	Exception traceback	required

Source code in extract_emails/browsers/page_source_getter.py

def __exit__(self, exc_type, exc_val, exc_tb) -> None:
    """Call ``stop()`` when the ``with`` block finishes.

    The exception details are accepted but not inspected; because the
    method returns ``None``, an in-flight exception keeps propagating.

    Args:
        exc_type: Exception type
        exc_val: Exception value
        exc_tb: Exception traceback
    """
    self.stop()

`aget_page_source(url)` `abstractmethod` `async` ¶

Return page content from a URL asynchronously

Parameters:

Name	Type	Description	Default
`url`	`str`	URL	required

Returns:

Type	Description
`str`	page content (html, json, whatever)

Source code in extract_emails/browsers/page_source_getter.py

@abstractmethod
async def aget_page_source(self, url: str) -> str:
    """Fetch whatever content is served at ``url``, asynchronously.

    Abstract stub: the body is empty and concrete browsers override it.

    Args:
        url: Address of the page to load.

    Returns:
        The page content (html, json, whatever).
    """

`get_page_source(url)` `abstractmethod` ¶

Return page content from a URL

Parameters:

Name	Type	Description	Default
`url`	`str`	URL	required

Returns:

Type	Description
`str`	page content (html, json, whatever)

Source code in extract_emails/browsers/page_source_getter.py

@abstractmethod
def get_page_source(self, url: str) -> str:
    """Fetch whatever content is served at ``url``.

    Abstract stub: the body is empty and concrete browsers override it.

    Args:
        url: Address of the page to load.

    Returns:
        The page content (html, json, whatever).
    """

Browsers¶

PageSourceGetter ¶

__aenter__() async ¶

__aexit__(exc_type, exc_val, exc_tb) async ¶

__enter__() ¶

__exit__(exc_type, exc_val, exc_tb) ¶

aget_page_source(url) abstractmethod async ¶

get_page_source(url) abstractmethod ¶

`PageSourceGetter` ¶

`__aenter__()` `async` ¶

`__aexit__(exc_type, exc_val, exc_tb)` `async` ¶

`__enter__()` ¶

`__exit__(exc_type, exc_val, exc_tb)` ¶

`aget_page_source(url)` `abstractmethod` `async` ¶

`get_page_source(url)` `abstractmethod` ¶