You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

35 lines
1.2 KiB

  1. import re
  2. from .common import InfoExtractor
  3. class InstagramIE(InfoExtractor):
  4. _VALID_URL = r'(?:http://)?instagram.com/p/(.*?)/'
  5. _TEST = {
  6. u'url': u'http://instagram.com/p/aye83DjauH/?foo=bar#abc',
  7. u'file': u'aye83DjauH.mp4',
  8. u'md5': u'0d2da106a9d2631273e192b372806516',
  9. u'info_dict': {
  10. u"uploader_id": u"naomipq",
  11. u"title": u"Video by naomipq",
  12. u'description': u'md5:1f17f0ab29bd6fe2bfad705f58de3cb8',
  13. }
  14. }
  15. def _real_extract(self, url):
  16. mobj = re.match(self._VALID_URL, url)
  17. video_id = mobj.group(1)
  18. webpage = self._download_webpage(url, video_id)
  19. uploader_id = self._search_regex(r'"owner":{"username":"(.+?)"',
  20. webpage, u'uploader id', fatal=False)
  21. desc = self._search_regex(r'"caption":"(.*?)"', webpage, u'description',
  22. fatal=False)
  23. return [{
  24. 'id': video_id,
  25. 'url': self._og_search_video_url(webpage),
  26. 'ext': 'mp4',
  27. 'title': u'Video by %s' % uploader_id,
  28. 'thumbnail': self._og_search_thumbnail(webpage),
  29. 'uploader_id' : uploader_id,
  30. 'description': desc,
  31. }]