锘??xml version="1.0" encoding="utf-8" standalone="yes"?>久久久久久久久波多野高潮,欧美伊香蕉久久综合类网站,7777久久亚洲中文字幕http://www.shnenglu.com/gaimor/category/20048.html涓氫綑CPP涓撳zh-cnSun, 08 Dec 2013 00:35:58 GMTSun, 08 Dec 2013 00:35:58 GMT60C璇█璋冪敤python鑴氭湰3http://www.shnenglu.com/gaimor/archive/2013/12/07/204649.htmlccsdu2009ccsdu2009Sat, 07 Dec 2013 07:48:00 GMThttp://www.shnenglu.com/gaimor/archive/2013/12/07/204649.htmlhttp://www.shnenglu.com/gaimor/comments/204649.htmlhttp://www.shnenglu.com/gaimor/archive/2013/12/07/204649.html#Feedback0http://www.shnenglu.com/gaimor/comments/commentRss/204649.htmlhttp://www.shnenglu.com/gaimor/services/trackbacks/204649.html
from bs4 import BeautifulSoup

def list_get(file):
    """Return the ``href`` of every ``<a class="link">`` element in an HTML file.

    Args:
        file: Path of the HTML document to parse.

    Returns:
        A list with one entry per matching anchor; an entry is ``None``
        when the anchor carries no ``href`` attribute.
    """
    # The markup is read while the soup is being constructed, so the handle
    # can be released as soon as the constructor returns instead of leaking.
    with open(file) as markup:
        soup = BeautifulSoup(markup)
    return [anchor.get('href') for anchor in soup.find_all('a', class_='link')]

if __name__ == "__main__":
    # Script entry point: run the extractor on the sample document.
    list_get("List.htm")

list_get函数返回的是list字符串对象<br />其c语言调用的代码如下:
#include <Python.h>

#include <stdio.h>
#include <stdlib.h>
#include <string.h>

char* GDALPythonObjectToCStr(PyObject* pyObject);

int main(int argc, char *argv[])
{
    Py_Initialize();  
    
if(!Py_IsInitialized())   
    {  
        
return -1;  
    }  
    
    PyRun_SimpleString(
"import sys");
    PyRun_SimpleString(
"sys.path.append('./script')");
    PyObject
* pModule;
    PyObject
* pDict;
    PyObject
* pFunc;

    pModule 
= PyImport_ImportModule("list");
    
if(!pModule)
    {
        printf(
"can't find list.py");
        system(
"PAUSE"); 
        getchar();
        
return -1;
    }
    
    pDict 
= PyModule_GetDict(pModule);
    
if(!pDict)
    {
        
return -1;
    }
    
    pFunc 
= PyDict_GetItemString(pDict,"list_get");
    
if(!pFunc || !PyCallable_Check(pFunc))
    {
        printf(
"can't find function [list_get]");
        getchar();
        
return -1;
    }
    
    PyObject
* args = PyTuple_New(1);
    PyTuple_SetItem(args,
0,Py_BuildValue("s","List.htm"));
    PyObject
* value = PyObject_CallObject(pFunc,args);
    
int ret = PySequence_Check(value);
    printf(
"check:%d\n",ret);
    
int length = PySequence_Size(value);
    printf(
"length:%d\n",length);
    
    
int i = 0;
    
for(;i<length;i++)
    {
        PyObject
* obj = PySequence_GetItem(value,i);  
        
//char* str = PyBytes_AS_STRING(obj);
        char* str = GDALPythonObjectToCStr(obj);
        printf(
"link:%s\n",str);    
        free(str);
    }
    
    Py_DECREF(args);
    Py_DECREF(pModule);
    Py_Finalize();    
    system(
"PAUSE");    
    
return 0;
}

/* Return a NULL terminated c String from a PyObject */
/* Result must be freed with GDALPythonFreeCStr */
char* GDALPythonObjectToCStr(PyObject* pyObject)
{
#if PY_VERSION_HEX >= 0x03000000
    
if(PyUnicode_Check(pyObject))
    {
        
char *pszStr;
        
char *pszNewStr;
        Py_ssize_t nLen;
        PyObject
* pyUTF8Str = PyUnicode_AsUTF8String(pyObject);
        PyBytes_AsStringAndSize(pyUTF8Str,
&pszStr,&nLen);
        pszNewStr 
= (char*)malloc(nLen+1);
        memcpy(pszNewStr,pszStr,nLen
+1);
        Py_XDECREF(pyUTF8Str);
        
return pszNewStr;
    }
    
else if(PyBytes_Check(pyObject))
    {
        
char *pszStr;
        
char *pszNewStr;
        Py_ssize_t nLen;
        PyBytes_AsStringAndSize(pyObject,
&pszStr,&nLen);
        pszNewStr 
= (char*)malloc(nLen+1);
        memcpy(pszNewStr,pszStr,nLen
+1);
        
return pszNewStr;
    }
    
else
    {
        
char *pszStr = (char*)malloc(1);
        pszStr[
0= '\0';
        
return pszStr;
    }
#else
    
return PyString_AsString(pyObject);
#endif
}


ccsdu2009 2013-12-07 15:48 发表评论
]]>
浣跨敤Beautiful Soup 瑙f瀽html鏂囨。http://www.shnenglu.com/gaimor/archive/2013/12/07/204645.htmlccsdu2009ccsdu2009Sat, 07 Dec 2013 03:17:00 GMThttp://www.shnenglu.com/gaimor/archive/2013/12/07/204645.htmlhttp://www.shnenglu.com/gaimor/comments/204645.htmlhttp://www.shnenglu.com/gaimor/archive/2013/12/07/204645.html#Feedback0http://www.shnenglu.com/gaimor/comments/commentRss/204645.htmlhttp://www.shnenglu.com/gaimor/services/trackbacks/204645.html灝辨嬁瑙f瀽html鏉ヨ錛屼嬌鐢?Beautiful Soup 灝辨瘮浣跨敤libtidy鏂逛究寰堝 - 褰撶劧涔熸湁鍙兘鏄?div>Beautiful Soup灝佽鐨勫緢鍘夊鍚?br />
使用Beautiful Soup的一个例子如下:
from bs4 import BeautifulSoup

# Print the href of every <a class="link"> element found in List.htm.
# The with-block closes the file once the document has been parsed.
with open('List.htm') as markup:
    soup = BeautifulSoup(markup)
for a in soup.find_all('a', class_='link'):
    print(a.get('href'))
鐩殑鏄壘鍑篽tml涓璫lass灞炴т負link鐨刟鑺傜偣瀵瑰簲鐨刪ref灞炴у瓧絎︿覆
濡傛灉鏄嬌鐢╟++ libtidy鐨勮瘽
瀵瑰簲鐨勪唬鐮佸涓?
/*
 * Report filter registered through tidySetReportFilter().
 * Answers `no` for every diagnostic, whatever its level, position or text.
 * NOTE(review): libtidy documents a `no` result as "do not output this
 * message" - confirm against the tidy version in use.
 */
Bool TIDY_CALL tidyFilterCb(TidyDoc tdoc, TidyReportLevel lvl, uint line, uint col, ctmbstr mssg)
{
    /* None of the arguments influence the answer. */
    (void)tdoc;
    (void)lvl;
    (void)line;
    (void)col;
    (void)mssg;

    return no;
}

void extractContent(TidyNode node,TidyDoc doc);

/*
 * Visit every direct child of `node`: anchor elements are handed to
 * extractContent(), all other children are descended into recursively.
 */
void parseContent(TidyNode node, TidyDoc doc)
{
    TidyNode cur = tidyGetChild(node);

    while (cur)
    {
        if (!tidyNodeIsA(cur))
        {
            parseContent(cur, doc);
        }
        else
        {
            extractContent(cur, doc);
        }
        cur = tidyGetNext(cur);
    }
}

/*
 * Print the href of `node` when it is an <a> element whose class attribute
 * is exactly "link" and whose href attribute has a value.
 *
 * In every other case (not an anchor, no matching class, no usable href)
 * the node's children are scanned through parseContent().
 */
void extractContent(TidyNode node, TidyDoc doc)
{
    if (yes == tidyNodeIsA(node))
    {
        TidyAttr cls = tidyAttrGetCLASS(node);
        /* An attribute written without a value has no string to compare. */
        ctmbstr value = (cls != NULL) ? tidyAttrValue(cls) : NULL;

        if (value != NULL && !strcmp(value, "link"))
        {
            TidyAttr href = tidyAttrGetHREF(node);
            ctmbstr link = (href != NULL) ? tidyAttrValue(href) : NULL;

            if (link != NULL)
            {
                printf("link:%s\n", link);
                return;
            }
        }
    }
    parseContent(node, doc);
}

void tidyParseHtml(char* file)
{
    TidyDoc doc 
= tidyCreate();
    tidySetReportFilter(doc,tidyFilterCb);
    tidyParseFile(doc,file);
    TidyNode body 
= tidyGetBody(doc);
    TidyNode child;
    
for(child = tidyGetChild(body);child;child = tidyGetNext(child))
    {   
        parseContent(child,doc);
    }    
    tidyRelease(doc); 
}
还是很啰嗦的

当然下面的python代码也能完成任务:
from bs4 import BeautifulSoup

# Print the href of every element matched by the CSS selector
# a[class="link"] in List.htm, skipping anchors without an href.
# The with-block closes the file once the document has been parsed.
with open('List.htm') as markup:
    soup = BeautifulSoup(markup)
for anchor in soup.select('a[class="link"]'):
    if anchor.has_attr('href'):
        print(anchor.get('href'))
如果想分析网页我觉得BeautifulSoup绝对是一个利器<br />链接:
http://www.crummy.com/software/BeautifulSoup/bs4/doc/


ccsdu2009 2013-12-07 11:17 发表评论
]]>
中文字幕一区二区三区久久网站| 国产精品99久久久精品无码| 久久精品国产亚洲网站| 国产99精品久久| 久久久久久久久久久免费精品| 成人综合久久精品色婷婷| 亚洲国产欧洲综合997久久| 国产一级持黄大片99久久| 久久免费视频一区| 一本色道久久88精品综合| 91秦先生久久久久久久| 99久久综合国产精品免费| 国产精品久久久久aaaa| 亚洲欧美日韩精品久久亚洲区| 久久99精品国产麻豆| 亚洲精品NV久久久久久久久久 | 精品国产日韩久久亚洲| 精品乱码久久久久久久| 久久精品极品盛宴观看| 久久综合给合综合久久| 久久精品国产一区| 欧洲精品久久久av无码电影 | 亚洲欧美日韩中文久久| 国产成人精品久久亚洲高清不卡 | 亚洲成色WWW久久网站| 蜜桃麻豆www久久国产精品| 91久久香蕉国产熟女线看| 久久66热人妻偷产精品9| 99精品国产综合久久久久五月天 | 一本色道久久88加勒比—综合| 人妻无码精品久久亚瑟影视| 天天做夜夜做久久做狠狠| 99久久精品这里只有精品| 久久99国产精品二区不卡| 久久婷婷五月综合色奶水99啪| 伊人久久大香线蕉综合Av| 精品国产99久久久久久麻豆| 7777久久久国产精品消防器材 | 国内精品久久久久久麻豆| 国产 亚洲 欧美 另类 久久| 久久国产精品二国产精品|