https://jabbalaci.herokuapp.com/all_links?url=<YOUR_URL>

add clustering

 
Notes:
  • duplicates are removed
  • try with and without clustering

Python API:
#!/usr/bin/env python

import re
import requests
import json

# Endpoint of the link-extraction web service queried by get_links().
BASE = "https://jabbalaci.herokuapp.com/all_links"


def get_links(url, pattern=r''):
    """
    Get all links on a webpage.

    The page is not fetched locally: its address is sent to the web
    service at BASE, and the 'urls' list of the JSON reply is used.

    :param url: address of the page whose links are wanted.
    :param pattern: optional regular expression; only links for which
        re.search() finds a match are kept. The default (empty) pattern
        keeps every link.
    :return: sorted list of the matching links, without duplicates.
    """
    # Pass the target as a query parameter so that requests percent-encodes
    # it; pasting it into the query string by hand corrupts the request
    # whenever the target itself contains '&', '#' or '+'.
    response = requests.get(BASE, params={'url': url})
    matches = re.compile(pattern).search
    # A distinct loop name keeps the `url` argument from being shadowed
    # (on Python 2 a list-comprehension variable leaks into the function).
    return sorted({link for link in response.json()['urls'] if matches(link)})

##############################################################

if __name__ == "__main__":
    # Demo: list the https links found on Reddit's front page.
    # The parenthesised form is valid both as a Python 2 print statement
    # and as a Python 3 print() call, and prints the same text in each.
    print(get_links("http://www.reddit.com", r'^https://'))