array( 'required' => false, ), 'cache_timeout' => array( 'required' => false, ), ); const PARAMETERS = array( 'Username' => array( 'u' => array( 'name' => 'username', 'exampleValue' => 'aesoprockwins', 'required' => true ) ), 'Hashtag' => array( 'h' => array( 'name' => 'hashtag', 'exampleValue' => 'beautifulday', 'required' => true ) ), 'Location' => array( 'l' => array( 'name' => 'location', 'exampleValue' => 'london', 'required' => true ) ), 'global' => array( 'media_type' => array( 'name' => 'Media type', 'type' => 'list', 'required' => false, 'values' => array( 'All' => 'all', 'Video' => 'video', 'Picture' => 'picture', 'Multiple' => 'multiple', ), 'defaultValue' => 'all' ), 'direct_links' => array( 'name' => 'Use direct media links', 'type' => 'checkbox', ) ) ); const TEST_DETECT_PARAMETERS = array( 'https://www.instagram.com/metaverse' => array('u' => 'metaverse'), 'https://instagram.com/metaverse' => array('u' => 'metaverse'), 'http://www.instagram.com/metaverse' => array('u' => 'metaverse'), ); const USER_QUERY_HASH = '58b6785bea111c67129decbe6a448951'; const TAG_QUERY_HASH = '9b498c08113f1e09617a1703c22b2f32'; const SHORTCODE_QUERY_HASH = '865589822932d1b43dfe312121dd353a'; public function getCacheTimeout() { $customTimeout = $this->getOption('cache_timeout'); return $customTimeout || parent::getCacheTimeout(); } protected function getContents($uri) { $headers = array(); $sessionId = $this->getOption('session_id'); if ($sessionId) { $headers[] = 'cookie: sessionid=' . $sessionId; } return getContents($uri, $headers); } protected function getInstagramUserId($username) { if(is_numeric($username)) return $username; $cacheFac = new CacheFactory(); $cacheFac->setWorkingDir(PATH_LIB_CACHES); $cache = $cacheFac->create(Configuration::getConfig('cache', 'type')); $cache->setScope(get_called_class()); $cache->setKey(array($username)); $key = $cache->loadData(); if($key == null) { $data = $this->getContents(self::URI . 'web/search/topsearch/?query=' . $username); foreach(json_decode($data)->users as $user) { if(strtolower($user->user->username) === strtolower($username)) { $key = $user->user->pk; } } if($key == null) { returnServerError('Unable to find username in search result.'); } $cache->saveData($key); } return $key; } public function collectData(){ $directLink = !is_null($this->getInput('direct_links')) && $this->getInput('direct_links'); $data = $this->getInstagramJSON($this->getURI()); if(!is_null($this->getInput('u'))) { $userMedia = $data->data->user->edge_owner_to_timeline_media->edges; } elseif(!is_null($this->getInput('h'))) { $userMedia = $data->data->hashtag->edge_hashtag_to_media->edges; } elseif(!is_null($this->getInput('l'))) { $userMedia = $data->entry_data->LocationsPage[0]->graphql->location->edge_location_to_media->edges; } foreach($userMedia as $media) { $media = $media->node; switch($this->getInput('media_type')) { case 'all': break; case 'video': if($media->__typename != 'GraphVideo' || !$media->is_video) continue 2; break; case 'picture': if($media->__typename != 'GraphImage') continue 2; break; case 'multiple': if($media->__typename != 'GraphSidecar') continue 2; break; default: break; } $item = array(); $item['uri'] = self::URI . 'p/' . $media->shortcode . '/'; if (isset($media->owner->username)) { $item['author'] = $media->owner->username; } $textContent = $this->getTextContent($media); $item['title'] = ($media->is_video ? '▶ ' : '') . $textContent; $titleLinePos = strpos(wordwrap($item['title'], 120), "\n"); if ($titleLinePos != false) { $item['title'] = substr($item['title'], 0, $titleLinePos) . '...'; } if($directLink) { $mediaURI = $media->display_url; } else { $mediaURI = self::URI . 'p/' . $media->shortcode . '/media?size=l'; } switch($media->__typename) { case 'GraphSidecar': $data = $this->getInstagramSidecarData($item['uri'], $item['title'], $media, $textContent); $item['content'] = $data[0]; $item['enclosures'] = $data[1]; break; case 'GraphImage': $item['content'] = ''; $item['content'] .= '' . $item['title'] . ''; $item['content'] .= '

' . nl2br(htmlentities($textContent)); $item['enclosures'] = array($mediaURI); break; case 'GraphVideo': $data = $this->getInstagramVideoData($item['uri'], $mediaURI, $media, $textContent); $item['content'] = $data[0]; if($directLink) { $item['enclosures'] = $data[1]; } else { $item['enclosures'] = array($mediaURI); } $item['thumbnail'] = $mediaURI; break; default: break; } $item['timestamp'] = $media->taken_at_timestamp; $this->items[] = $item; } } // returns Sidecar(a post which has multiple media)'s contents and enclosures protected function getInstagramSidecarData($uri, $postTitle, $mediaInfo, $textContent) { $enclosures = array(); $content = ''; foreach($mediaInfo->edge_sidecar_to_children->edges as $singleMedia) { $singleMedia = $singleMedia->node; if($singleMedia->is_video) { if(in_array($singleMedia->video_url, $enclosures)) continue; // check if not added yet $content .= '
'; array_push($enclosures, $singleMedia->video_url); } else { if(in_array($singleMedia->display_url, $enclosures)) continue; // check if not added yet $content .= ''; $content .= '' . $postTitle . ''; $content .= '
'; array_push($enclosures, $singleMedia->display_url); } } $content .= '
' . nl2br(htmlentities($textContent)); return array($content, $enclosures); } // returns Video post's contents and enclosures protected function getInstagramVideoData($uri, $mediaURI, $mediaInfo, $textContent) { $content = '
'; $content .= '
' . nl2br(htmlentities($textContent)); return array($content, array($mediaInfo->video_url)); } protected function getTextContent($media) { $textContent = '(no text)'; //Process the first element, that isn't in the node graph if (count($media->edge_media_to_caption->edges) > 0) { $textContent = trim($media->edge_media_to_caption->edges[0]->node->text); } return $textContent; } protected function getInstagramJSON($uri) { if(!is_null($this->getInput('u'))) { $userId = $this->getInstagramUserId($this->getInput('u')); $data = $this->getContents(self::URI . 'graphql/query/?query_hash=' . self::USER_QUERY_HASH . '&variables={"id"%3A"' . $userId . '"%2C"first"%3A10}'); return json_decode($data); } elseif(!is_null($this->getInput('h'))) { $data = $this->getContents(self::URI . 'graphql/query/?query_hash=' . self::TAG_QUERY_HASH . '&variables={"tag_name"%3A"' . $this->getInput('h') . '"%2C"first"%3A10}'); return json_decode($data); } else { $html = getContents($uri); $scriptRegex = '/window\._sharedData = (.*);<\/script>/'; preg_match($scriptRegex, $html, $matches, PREG_OFFSET_CAPTURE, 0); return json_decode($matches[1][0]); } } public function getName(){ if(!is_null($this->getInput('u'))) { return $this->getInput('u') . ' - Instagram Bridge'; } return parent::getName(); } public function getURI(){ if(!is_null($this->getInput('u'))) { return self::URI . urlencode($this->getInput('u')) . '/'; } elseif(!is_null($this->getInput('h'))) { return self::URI . 'explore/tags/' . urlencode($this->getInput('h')); } elseif(!is_null($this->getInput('l'))) { return self::URI . 'explore/locations/' . urlencode($this->getInput('l')); } return parent::getURI(); } public function detectParameters($url){ $params = array(); // By username $regex = '/^(https?:\/\/)?(www\.)?instagram\.com\/([^\/?\n]+)/'; if(preg_match($regex, $url, $matches) > 0) { $params['u'] = urldecode($matches[3]); return $params; } return null; } }