• 设为首页
  • 点击收藏
  • 手机版
    手机扫一扫访问
    迪恩网络手机版
  • 关注官方公众号
    微信扫一扫关注
    迪恩网络公众号

Python utils.sanitize_url函数代码示例

原作者: [db:作者] 来自: [db:来源] 收藏 邀请

本文整理汇总了 Python 中 r2.lib.utils.sanitize_url 函数的典型用法代码示例。如果您正苦于以下问题:Python sanitize_url 函数的具体用法?Python sanitize_url 怎么用?Python sanitize_url 使用的例子?那么恭喜您,这里精选的函数代码示例或许可以为您提供帮助。



在下文中一共展示了sanitize_url函数的20个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于我们的系统推荐出更棒的Python代码示例。

示例1: test_sanitize_url

    def test_sanitize_url(self):
        """Check how utils.sanitize_url handles trailing dots in hostnames.

        A single trailing dot on the hostname is expected to be removed,
        URLs without one are expected to come back unchanged, and a
        hostname ending in two dots is expected to yield None.
        """
        # (input URL, expected sanitized URL)
        cases = [
            ('http://dk./', 'http://dk/'),
            ('http://google.com./', 'http://google.com/'),
            ('http://google.com/', 'http://google.com/'),
            ('https://github.com/reddit/reddit/pull/1302',
             'https://github.com/reddit/reddit/pull/1302'),
        ]
        for raw, expected in cases:
            # assertEqual replaces the deprecated assertEquals alias.
            self.assertEqual(utils.sanitize_url(raw), expected)

        # A doubled trailing dot must be rejected outright.
        self.assertIsNone(utils.sanitize_url('http://dk../'))
开发者ID:zeantsoi,项目名称:reddit,代码行数:25,代码来源:utils_test.py


示例2: link_equals

def link_equals(urla, urlb, fast=False):
    """Report whether two URLs are equal after sanitizing.

    Unless ``fast`` is true, each URL is first replaced by the URL that
    ``geturl()`` reports after opening a ``HeadRequest`` for it with
    ``urllib2.urlopen``. Both URLs are then passed through
    ``sanitize_url`` and compared with ``==``.

    Returns True when the sanitized URLs are equal. Returns False when
    they differ or when any step raises an exception (the comparison is
    best-effort and never propagates lookup errors).
    """
    try:
        if not fast:
            urla = urllib2.urlopen(HeadRequest(urla)).geturl()
            urlb = urllib2.urlopen(HeadRequest(urlb)).geturl()
        return sanitize_url(urla) == sanitize_url(urlb)
    except Exception:
        # Deliberately best-effort: network or parsing failures mean
        # "not equal". Unlike a bare except, this lets KeyboardInterrupt
        # and SystemExit propagate.
        return False
开发者ID:constantAmateur,项目名称:sciteit,代码行数:11,代码来源:sr_rss.py


示例3: run

    def run(self, url, sr = None):
        """Validate a submitted URL, optionally looking up existing links.

        ``sr`` is resolved first: with no ``sr`` given and a non-fake
        ``c.site``, the current site is used; a truthy ``sr`` is looked up
        by name (a failed lookup records SUBREDDIT_NOEXIST and leaves
        ``sr`` as None); anything else becomes None.

        Returns the sanitized URL, or the existing link(s) as a tuple when
        the URL was already submitted (ALREADY_SUB is recorded), or the
        result of ``self.error`` for a missing or bad URL.
        """
        if sr is None and not isinstance(c.site, FakeSubreddit):
            sr = c.site
        elif not sr:
            sr = None
        else:
            try:
                sr = Subreddit._by_name(str(sr))
            except (NotFound, UnicodeEncodeError):
                self.set_error(errors.SUBREDDIT_NOEXIST)
                sr = None

        if not url:
            return self.error(errors.NO_URL)

        cleaned = utils.sanitize_url(url)
        if not cleaned:
            return self.error(errors.BAD_URL)

        # 'self' is only acceptable when this validator allows self posts.
        if cleaned == 'self':
            if self.allow_self:
                return cleaned
            return self.error(errors.BAD_URL)

        # Without lookup there is no duplicate check to perform.
        if not self.lookup:
            return cleaned

        try:
            existing = Link._by_url(cleaned, sr)
            self.error(errors.ALREADY_SUB)
            return utils.tup(existing)
        except NotFound:
            return cleaned
开发者ID:jaycobcoleman,项目名称:reddit,代码行数:31,代码来源:validator.py


示例4: GET_bookmarklet

    def GET_bookmarklet(self, what):
        '''Controller for the functionality of the bookmarklets (not the distribution page)

        The action ('like', 'dislike' or 'save') is taken from the prefix
        of ``what``. The target URL comes from the ``u`` request parameter
        and the user hash from ``uh``. The response is always a redirect
        to a static image that signals the outcome:

        * css_submit.png  -- no viewable link exists for the URL
        * css_login.png   -- links exist but the user is not logged in
        * css_update.png  -- the supplied user hash is not valid
        * css_<action>d.png -- otherwise, after voting on or saving the link
        '''
        action = ''
        for candidate in ('like', 'dislike', 'save'):
            if what.startswith(candidate):
                action = candidate
                break

        url = sanitize_url(request.get.u)
        uh = request.get.get('uh', "")

        try:
            links = Link._by_url(url)
        except Exception:
            # Any lookup failure is treated as "no links for this URL".
            links = []

        Subreddit.load_subreddits(links, return_dict = False)
        user = c.user if c.user_is_loggedin else None
        links = [l for l in links if l.subreddit_slow.can_view(user)]

        if not links:
            return self.redirect("/static/css_submit.png")
        if not c.user_is_loggedin:
            return self.redirect("/static/css_login.png")
        if not c.user.valid_hash(uh):
            return self.redirect("/static/css_update.png")

        if action in ('like', 'dislike'):
            # vote on all of the links
            for link in links:
                Vote.vote(c.user, link, action == 'like', request.ip)
        elif action == 'save':
            # only the highest-scoring link is saved
            link = max(links, key = lambda x: x._score)
            link._save(c.user)
        return self.redirect("/static/css_%sd.png" % action)
开发者ID:cmak,项目名称:reddit,代码行数:34,代码来源:api.py


示例5: GET_search

    def GET_search(self, query, num, reverse, after, count, sort, restrict_sr):
        """Search links page.

        A query that contains a dot and that sanitize_url accepts as a URL
        (scheme required) is redirected to /submit with that URL instead
        of being searched. Otherwise the query is run as an IndextankQuery
        against DefaultSR(), or against c.site when restrict_sr is set,
        and the rendered SearchPage is returned. IndextankException and
        socket.error are passed to self.search_fail.
        """
        if query and '.' in query:
            url = sanitize_url(query, require_scheme = True)
            if url:
                return self.redirect("/submit" + query_string({'url':url}))

        site = c.site if restrict_sr else DefaultSR()

        try:
            q = IndextankQuery(query, site, sort)

            num, t, spane = self._search(q, num = num, after = after, reverse = reverse,
                                         count = count)
            res = SearchPage(_('search results'), query, t, num, content=spane,
                             nav_menus = [SearchSortMenu(default=sort)],
                             search_params = dict(sort = sort),
                             simple=False, site=c.site, restrict_sr=restrict_sr).render()

            return res
        except (IndextankException, socket.error) as e:
            return self.search_fail(e)
开发者ID:donslice,项目名称:reddit,代码行数:25,代码来源:front.py


示例6: run

 def run(self, url, sr = None):
     """Validate a submitted URL and detect an existing submission.

     ``sr`` falls back to ``c.site`` when not given and the current site
     is not a FakeSubreddit; a truthy ``sr`` is looked up by name, and a
     failed lookup adds SUBREDDIT_NOEXIST to ``c.errors`` and leaves
     ``sr`` as None.

     Returns the sanitized URL (including the literal 'self'), the
     existing link(s) as a tuple when the URL is already submitted
     (ALREADY_SUB is recorded), or the result of ``self.error`` when the
     URL is missing or does not sanitize.
     """
     if sr is None and not isinstance(c.site, FakeSubreddit):
         sr = c.site
     elif not sr:
         sr = None
     else:
         try:
             sr = Subreddit._by_name(sr)
         except NotFound:
             c.errors.add(errors.SUBREDDIT_NOEXIST)
             sr = None

     if not url:
         return self.error(errors.NO_URL)

     cleaned = utils.sanitize_url(url)
     if not cleaned:
         return self.error(errors.BAD_URL)
     if cleaned == 'self':
         return cleaned

     try:
         existing = Link._by_url(cleaned, sr)
         self.error(errors.ALREADY_SUB)
         return utils.tup(existing)
     except NotFound:
         return cleaned
开发者ID:camspiers,项目名称:lesswrong,代码行数:25,代码来源:validator.py


示例7: GET_search

    def GET_search(self, query, num, reverse, after, count, sort):
        """Render the link search results page for ``query``.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise an IndextankQuery
        is run against ``c.site``. When the current site is a real
        subreddit and no cname is in effect, an info text is added that
        links to the same search across all reddits.
        """
        if query and '.' in query:
            submit_url = sanitize_url(query, require_scheme = True)
            if submit_url:
                return self.redirect("/submit" + query_string({'url':submit_url}))

        search_query = IndextankQuery(query, c.site, sort)
        num, t, spane = self._search(search_query, num = num, after = after,
                                     reverse = reverse, count = count)

        if isinstance(c.site, FakeSubreddit) or c.cname:
            infotext = None
        else:
            all_reddits_link = "%s/search%s" % (subreddit.All.path,
                                                query_string({'q': query}))
            params = {
                'reddit_name': c.site.name,
                'reddit_link': "http://%s/"%get_domain(cname = c.cname),
                'all_reddits_link': all_reddits_link,
            }
            infotext = strings.searching_a_reddit % params

        page = SearchPage(_('search results'), query, t, num, content=spane,
                          nav_menus = [SearchSortMenu(default=sort)],
                          search_params = dict(sort = sort),
                          infotext = infotext)
        return page.render()
开发者ID:JediWatchman,项目名称:reddit,代码行数:28,代码来源:front.py


示例8: GET_search

    def GET_search(self, query, num, reverse, after, count, sort, restrict_sr):
        """Search links page.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise the "proddit:"
        prefix in the query is rewritten to "reddit:" for the search and
        rewritten back before the page is rendered.

        If the search raises InvalidIndextankQuery, the query is reduced
        to word and whitespace characters, lower-cased, and retried; an
        explanatory message plus the search-help text is shown as info
        text. A query that reduces to nothing yields an empty result set.
        IndextankException and socket.error are passed to
        self.search_fail.
        """
        if query and "." in query:
            url = sanitize_url(query, require_scheme=True)
            if url:
                return self.redirect("/submit" + query_string({"url": url}))

        if not restrict_sr:
            site = DefaultSR()
        else:
            site = c.site

        try:
            cleanup_message = None
            try:
                # NOTE(review): this first query object is discarded once
                # the prefix has been rewritten below. It is kept because
                # the constructor's behaviour is not visible from here.
                q = IndextankQuery(query, site, sort)
                if query:
                    query = query.replace("proddit:", "reddit:")

                q = IndextankQuery(query, site, sort)
                num, t, spane = self._search(q, num=num, after=after, reverse=reverse, count=count)
            except InvalidIndextankQuery:

                # strip the query down to a whitelist
                cleaned = re.sub(r"[^\w\s]+", "", query)
                cleaned = cleaned.lower()

                # if it was nothing but mess, we have to stop
                if not cleaned.strip():
                    num, t, spane = 0, 0, []
                    cleanup_message = strings.completely_invalid_search_query
                else:
                    q = IndextankQuery(cleaned, site, sort)

                    num, t, spane = self._search(q, num=num, after=after, reverse=reverse, count=count)
                    cleanup_message = strings.invalid_search_query % {"clean_query": cleaned}
                # the help text is appended in both cases
                cleanup_message += " "
                cleanup_message += strings.search_help % {"search_help": self.search_help_page}

            # show the user the prefix they typed, not the rewritten one
            if query:
                query = query.replace("reddit:", "proddit:")

            res = SearchPage(
                _("search results"),
                query,
                t,
                num,
                content=spane,
                nav_menus=[SearchSortMenu(default=sort)],
                search_params=dict(sort=sort),
                infotext=cleanup_message,
                simple=False,
                site=c.site,
                restrict_sr=restrict_sr,
            ).render()

            return res
        except (IndextankException, socket.error) as e:
            return self.search_fail(e)
开发者ID:xolar,项目名称:proddit,代码行数:60,代码来源:front.py


示例9: GET_search

    def GET_search(self, query, num, reverse, after, count, sort, restrict_sr, syntax):
        """Search links page.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise a SearchQuery is
        run against DefaultSR(), or against c.site when restrict_sr is
        set, using ``syntax`` or SearchQuery.default_syntax when none is
        given.

        On InvalidQuery the query is reduced to word and whitespace
        characters, lower-cased, stripped, and retried without an
        explicit syntax; the info text explains what was searched
        instead. The exceptions in SearchException, plus socket.error,
        are passed to self.search_fail.
        """
        if query and "." in query:
            url = sanitize_url(query, require_scheme=True)
            if url:
                return self.redirect("/submit" + query_string({"url": url}))

        if not restrict_sr:
            site = DefaultSR()
        else:
            site = c.site

        if not syntax:
            syntax = SearchQuery.default_syntax

        try:
            cleanup_message = None
            try:
                q = SearchQuery(query, site, sort, syntax=syntax)
                results, etime, spane = self._search(q, num=num, after=after, reverse=reverse, count=count)
            except InvalidQuery:
                # Clean the search of characters that might be causing the
                # InvalidQuery exception. If the cleaned search boils down
                # to an empty string, the search code is expected to bail
                # out early with an empty result set.
                cleaned = re.sub(r"[^\w\s]+", " ", query)
                cleaned = cleaned.lower().strip()

                q = SearchQuery(cleaned, site, sort)
                results, etime, spane = self._search(q, num=num, after=after, reverse=reverse, count=count)
                if cleaned:
                    cleanup_message = strings.invalid_search_query % {"clean_query": cleaned}
                    cleanup_message += " "
                    cleanup_message += strings.search_help % {"search_help": self.search_help_page}
                else:
                    cleanup_message = strings.completely_invalid_search_query

            res = SearchPage(
                _("search results"),
                query,
                etime,
                results.hits,
                content=spane,
                nav_menus=[SearchSortMenu(default=sort)],
                search_params=dict(sort=sort),
                infotext=cleanup_message,
                simple=False,
                site=c.site,
                restrict_sr=restrict_sr,
                syntax=syntax,
                converted_data=q.converted_data,
                facets=results.subreddit_facets,
                sort=sort,
            ).render()

            return res
        except SearchException + (socket.error,) as e:
            return self.search_fail(e)
开发者ID:nod3x,项目名称:reddit,代码行数:58,代码来源:front.py


示例10: GET_search

    def GET_search(self, query, num, time, reverse, after, count, langs, sort):
        """Render the link search results page for ``query``.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. ``langs`` is split on commas
        when it matches ``self.verify_langs_regex``; otherwise
        ``c.content_langs`` is used. The search is limited to the user's
        friends on the Friends site, to the member subreddits of a
        MultiReddit, or to the current subreddit when it is a real one.
        """
        if query and '.' in query:
            submit_url = sanitize_url(query, require_scheme=True)
            if submit_url:
                return self.redirect("/submit" + query_string({'url': submit_url}))

        langs_valid = langs and self.verify_langs_regex.match(langs)
        langs = langs.split(',') if langs_valid else c.content_langs

        # At most one of these two filters is set, depending on the site.
        authors = None
        subreddits = None
        if c.site == subreddit.Friends and c.user_is_loggedin and c.user.friends:
            authors = c.user.friends
        elif isinstance(c.site, MultiReddit):
            subreddits = c.site.sr_ids
        elif not isinstance(c.site, FakeSubreddit):
            subreddits = [c.site._id]

        search_query = LinkSearchQuery(
            q=query,
            timerange=time,
            langs=langs,
            subreddits=subreddits,
            authors=authors,
            sort=SearchSortMenu.operator(sort))

        num, t, spane = self._search(
            search_query, num=num, after=after, reverse=reverse, count=count)

        if isinstance(c.site, FakeSubreddit) or c.cname:
            infotext = None
        else:
            all_reddits_link = "%s/search%s" % (subreddit.All.path,
                                                query_string({'q': query}))
            params = {
                'reddit_name': c.site.name,
                'reddit_link': "http://%s/" % get_domain(cname=c.cname),
                'all_reddits_link': all_reddits_link
            }
            infotext = strings.searching_a_reddit % params

        page = SearchPage(
            _('search results'),
            query,
            t,
            num,
            content=spane,
            nav_menus=[TimeMenu(default=time),
                       SearchSortMenu(default=sort)],
            search_params=dict(sort=sort, t=time),
            infotext=infotext)
        return page.render()
开发者ID:szimpatikus,项目名称:szimpatikus.hu,代码行数:58,代码来源:front.py


示例11: find_dups

def find_dups(new, fast=True):
    """Check to see if anyone else is using the same feed.

    ``new`` is sanitized and compared, via ``link_equals``, against every
    non-empty feed URL in the mapping returned by ``get_sr_rss()``.
    ``fast`` is passed through to ``link_equals``.

    Returns the key (category) of the first matching feed, or None when
    no feed matches.
    """
    rss = get_sr_rss()
    new = sanitize_url(new)
    for category in rss.keys():
        feed_url = rss[category]
        if not feed_url:
            continue
        # Single-argument print(...) behaves the same as the print
        # statement on Python 2.
        print(feed_url)
        if link_equals(feed_url, new, fast=fast):
            return category
    return None
开发者ID:constantAmateur,项目名称:sciteit,代码行数:9,代码来源:sr_rss.py


示例12: GET_search

    def GET_search(self, query, num, reverse, after, count, sort, restrict_sr,
                   syntax):
        """Search links page.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise a SearchQuery is
        run against DefaultSR(), or against c.site when restrict_sr is
        set, using ``syntax`` or SearchQuery.default_syntax when none is
        given.

        On InvalidQuery the query is reduced to word and whitespace
        characters and lower-cased. If nothing but whitespace remains, an
        empty result set is shown; otherwise the cleaned query is
        searched. In both cases an explanatory message plus the
        search-help text becomes the info text. The exceptions in
        SearchException, plus socket.error, are passed to
        self.search_fail.
        """
        if query and '.' in query:
            url = sanitize_url(query, require_scheme = True)
            if url:
                return self.redirect("/submit" + query_string({'url':url}))

        if not restrict_sr:
            site = DefaultSR()
        else:
            site = c.site

        if not syntax:
            syntax = SearchQuery.default_syntax

        try:
            cleanup_message = None
            try:
                q = SearchQuery(query, site, sort, syntax=syntax)
                num, t, spane = self._search(q, num=num, after=after,
                                             reverse = reverse, count = count)
            except InvalidQuery:
                # strip the query down to a whitelist
                cleaned = re.sub(r"[^\w\s]+", " ", query)
                cleaned = cleaned.lower()

                # if it was nothing but mess, we have to stop
                if not cleaned.strip():
                    num, t, spane = 0, 0, []
                    cleanup_message = strings.completely_invalid_search_query
                else:
                    q = SearchQuery(cleaned, site, sort)
                    num, t, spane = self._search(q, num=num, after=after,
                                                 reverse=reverse, count=count)
                    cleanup_message = strings.invalid_search_query % {
                                          "clean_query": cleaned
                                      }
                # the help text is appended in both cases
                cleanup_message += " "
                cleanup_message += strings.search_help % {"search_help":
                                                          self.search_help_page
                                                          }

            res = SearchPage(_('search results'), query, t, num, content=spane,
                             nav_menus=[SearchSortMenu(default=sort)],
                             search_params=dict(sort=sort),
                             infotext=cleanup_message,
                             simple=False, site=c.site,
                             restrict_sr=restrict_sr,
                             syntax=syntax,
                             converted_data=q.converted_data
                             ).render()

            return res
        except SearchException + (socket.error,) as e:
            return self.search_fail(e)
开发者ID:DanHoerst,项目名称:reddit,代码行数:56,代码来源:front.py


示例13: fetch_feed

def fetch_feed(rss):
    """Parse the feed at ``rss`` and return the parsed result.

    The URL is sanitized with ``sanitize_url`` and then handed to
    ``feedparser.parse``. When ``rss`` is empty, does not sanitize, or
    parsing raises, "Invalid feed." is printed and None is returned.
    """
    if rss:
        rss = sanitize_url(rss)
        if rss:
            try:
                return feedparser.parse(rss)
            except Exception:
                # Fall through to the "Invalid feed." report below.
                # Unlike a bare except, KeyboardInterrupt and SystemExit
                # are allowed to propagate.
                pass
    print("Invalid feed.")
    return None
开发者ID:constantAmateur,项目名称:sciteit,代码行数:10,代码来源:sr_rss.py


示例14: _extract_isolated_urls

def _extract_isolated_urls(md):
    """Extract URLs that exist on their own lines in given markdown.

    This style borrowed from wordpress, which is nice because it's tolerant to
    failures and is easy to understand. See https://codex.wordpress.org/Embeds

    """
    urls = []
    for line in md.splitlines():
        url = sanitize_url(line, require_scheme=True)
        if url and url != "self":
            urls.append(url)
    return urls
开发者ID:madbook,项目名称:reddit-plugin-liveupdate,代码行数:13,代码来源:media_embeds.py


示例15: demangle_url

def demangle_url(path):
    """Rebuild a URL from a request path and return it sanitized.

    The ``strip_sr``, ``strip_s_path`` and ``leading_slash`` patterns are
    removed from ``path``, "http://" is prepended when ``has_protocol``
    does not match, and the first "/" is doubled when
    ``need_insert_slash`` matches. The result is whatever
    ``utils.sanitize_url`` returns for that string.
    """
    # there's often some URL mangling done by the stack above us, so
    # let's clean up the URL before looking it up
    path = strip_sr.sub('', path)
    path = strip_s_path.sub('', path)
    path = leading_slash.sub("", path)

    if not has_protocol.match(path):
        path = 'http://%s' % path

    if need_insert_slash.match(path):
        # presumably restores "scheme://" after a slash was collapsed
        # upstream -- TODO confirm against the need_insert_slash pattern.
        # str.replace replaces the deprecated string.replace function.
        path = path.replace('/', '//', 1)

    return utils.sanitize_url(path)
开发者ID:DFectuoso,项目名称:culter,代码行数:16,代码来源:toolbar.py


示例16: run

 def run(self, url, sr):
     """Validate a submitted URL against the subreddit named ``sr``.

     Returns the sanitized URL (including the literal 'self'), the stored
     URL of an existing link when the URL is already submitted
     (ALREADY_SUB is recorded), or the result of ``self.error`` when the
     URL is missing or does not sanitize.
     """
     sr = Subreddit._by_name(sr)

     if not url:
         return self.error(errors.NO_URL)

     cleaned = utils.sanitize_url(url)
     if not cleaned:
         return self.error(errors.BAD_URL)
     if cleaned == 'self':
         return cleaned

     try:
         existing = Link._by_url(cleaned, sr)
         self.error(errors.ALREADY_SUB)
         return existing.url
     except NotFound:
         return cleaned
开发者ID:cmak,项目名称:reddit,代码行数:16,代码来源:validator.py


示例17: validate_link

def validate_link(url, whitelist=False):
    """Return the sanitized URL if it may be submitted, else False.

    False is returned when ``url`` is empty or does not sanitize, when
    ``whitelist`` is set and the URL's domain is not in
    ``DOMAIN_WHITELIST``, or when a non-deleted link already exists for
    the URL. The last two cases also print a short message.
    """
    if not url:
        return False

    url = sanitize_url(url)
    if not url:
        return False

    if whitelist and domain(url) not in DOMAIN_WHITELIST:
        print("Domain %s not in whitelist." % domain(url))
        return False

    try:
        lbu = LinksByUrl._byID(LinksByUrl._key_from_url(url))
    except tdb_cassandra.NotFound:
        # No link has been recorded for this URL.
        return url

    link_id36s = lbu._values()
    links = Link._byID36(link_id36s, data=True, return_dict=False)
    live_links = [l for l in links if not l._deleted]
    if not live_links:
        # Every recorded link was deleted, so the URL is free again.
        return url

    print("Link %s exists..." % url)
    return False
开发者ID:constantAmateur,项目名称:sciteit,代码行数:18,代码来源:sr_rss.py


示例18: GET_search

    def GET_search(self, query, num, reverse, after, count, sort, restrict_sr):
        """Search links page.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise an IndextankQuery
        is run against DefaultSR(), or against c.site when restrict_sr is
        set.

        On InvalidIndextankQuery the special characters listed below are
        deleted from the query, the search is retried, and the info text
        tells the user what was searched instead. IndextankException and
        socket.error are passed to self.search_fail.
        """
        if query and '.' in query:
            url = sanitize_url(query, require_scheme = True)
            if url:
                return self.redirect("/submit" + query_string({'url':url}))

        if not restrict_sr:
            site = DefaultSR()
        else:
            site = c.site

        try:
            cleanup_message = None
            try:
                q = IndextankQuery(query, site, sort)
                num, t, spane = self._search(q, num=num, after=after,
                                             reverse = reverse, count = count)
            except InvalidIndextankQuery:
                # delete special characters from the query and run again
                special_characters = '+-&|!(){}[]^"~*?:\\'
                # Mapping code points to None makes translate() drop them.
                # NOTE(review): a dict table requires query to be a
                # unicode string on Python 2 -- confirm with the caller.
                translation = dict((ord(char), None)
                                   for char in special_characters)
                cleaned = query.translate(translation)

                q = IndextankQuery(cleaned, site, sort)
                num, t, spane = self._search(q, num=num, after=after,
                                             reverse = reverse, count = count)
                cleanup_message = _('I couldn\'t understand your query, ' +
                                    'so I simplified it and searched for ' +
                                    '"%(clean_query)s" instead.') % {
                                        'clean_query': cleaned }

            res = SearchPage(_('search results'), query, t, num, content=spane,
                             nav_menus = [SearchSortMenu(default=sort)],
                             search_params = dict(sort = sort),
                             infotext=cleanup_message,
                             simple=False, site=c.site,
                             restrict_sr=restrict_sr).render()

            return res
        except (IndextankException, socket.error) as e:
            return self.search_fail(e)
开发者ID:VincentVazzo,项目名称:reddit,代码行数:43,代码来源:front.py


示例19: GET_search

    def GET_search(self, query, num, time, reverse, after, count, langs):
        """Render the link search results page for ``query``.

        A query that contains a dot and sanitizes to a URL (scheme
        required) is redirected to /submit. Otherwise ``self._search``
        is run for Link objects only and the rendered SearchPage is
        returned.
        """
        if query and '.' in query:
            submit_url = sanitize_url(query, require_scheme = True)
            if submit_url:
                return self.redirect("/submit" + query_string({'url':submit_url}))

        # NOTE(review): langs is normalised here but not passed on to the
        # search below.
        langs_valid = langs and self.verify_langs_regex.match(langs)
        langs = langs.split(',') if langs_valid else None

        num, t, spane = self._search(query, time=time,
                                     num = num, after = after,
                                     reverse = reverse,
                                     count = count, types = [Link])

        page = SearchPage(_('search results'), query, t, num, content=spane,
                          nav_menus = [TimeMenu(default = time)])
        return page.render()
开发者ID:cmak,项目名称:reddit,代码行数:21,代码来源:front.py


示例20: demangle_url

def demangle_url(path):
    """Rebuild a URL from a request path and return it sanitized.

    The ``strip_sr``, ``strip_s_path`` and ``leading_slash`` patterns are
    removed from ``path``. A path that matches ``has_protocol`` must also
    match ``allowed_protocol``; a path without a protocol gets
    ``g.default_scheme`` prepended. The first "/" is doubled when
    ``need_insert_slash`` matches.

    Returns the result of ``utils.sanitize_url``, or None when the
    protocol is not allowed or ``sanitize_url`` raises TypeError.
    """
    # there's often some URL mangling done by the stack above us, so
    # let's clean up the URL before looking it up
    path = strip_sr.sub('', path)
    path = strip_s_path.sub('', path)
    path = leading_slash.sub("", path)

    if has_protocol.match(path):
        if not allowed_protocol.match(path):
            return None
    else:
        path = '%s://%s' % (g.default_scheme, path)

    if need_insert_slash.match(path):
        # presumably restores "scheme://" after a slash was collapsed
        # upstream -- TODO confirm against the need_insert_slash pattern.
        # str.replace replaces the deprecated string.replace function.
        path = path.replace('/', '//', 1)

    try:
        return utils.sanitize_url(path)
    except TypeError:
        return None
开发者ID:AHAMED750,项目名称:reddit,代码行数:22,代码来源:toolbar.py



注:本文中的r2.lib.utils.sanitize_url函数示例由纯净天空整理自Github/MSDocs等源码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。


鲜花

握手

雷人

路过

鸡蛋
该文章已有0人参与评论

请发表评论

全部评论

专题导读
上一篇:
Python utils.set_last_modified函数代码示例发布时间:2022-05-26
下一篇:
Python utils.randstr函数代码示例发布时间:2022-05-26
热门推荐
阅读排行榜

扫描微信二维码

查看手机版网站

随时了解更新最新资讯

139-2527-9053

在线客服(服务时间 9:00~18:00)

在线QQ客服
地址:深圳市南山区西丽大学城创智工业园
电邮:jeky_zhao#qq.com
移动电话:139-2527-9053

Powered by 互联科技 X3.4© 2001-2213 极客世界.|Sitemap