资料来源:网络整理
时间:2023/2/14 0:38:35 共计:3633 浏览
采集爱奇艺视频的地址、时长、描述等内容
view sourceprint?
/// <summary>
/// Form that scrapes an iQiyi listing page: it collects the episode links and
/// their durations from the page whose address is typed into <c>textBox1</c>,
/// downloads every episode page, builds a flash-player URL for it and copies
/// the collected text to the clipboard.
/// </summary>
public partial class Form1 : Form
{
    // Captures the value assigned to param['vid'] in an episode page.
    private readonly string vidpattern = @"param\['vid'\] = ""([\d\w]+)"";";

    // Episode link / duration patterns used when checkBox1 is checked.
    private readonly string urlpattern = @"mod-piclist_pic_link"" href=""(http://www.iqiyi.com/(.+).html)";
    private readonly string timepattern = @"sign-time-right"">([\s\S]*?)</span>";

    // Alternate episode link / duration patterns used when checkBox1 is unchecked.
    private readonly string urlpattern1 = @"<a class=""site-piclist_pic_link"" href=""(http://www.iqiyi.com/(.+).html)";
    private readonly string timepattern1 = @"<span class=""mod-listTitle_right"" rseat=""time\d+"">(.+?)</span>";

    // Captures the numeric album id of an episode page.
    private readonly string albumIdpattern = @"albumId: ([\d]+),";

    // Captures the page title without the trailing "-爱奇艺" site suffix.
    private readonly string titlepattern = @"<title>(.+)-爱奇艺</title>";

    // Captures the path part (between host and ".html") of the canonical link.
    private readonly string wpattern = @"<link rel=""canonical"" href=""http://www.iqiyi.com/(.+?).html"" />";

    // Player URL template: {0} = vid, {1} = canonical path, {2} = album id
    // (the album id is used for both albumId and tvId).
    private readonly string format = @"http://player.video.qiyi.com/{0}/0/0/{1}.swf-albumId={2}-tvId={2}-isPurchase=0-cnId=12";

    /// <summary>
    /// Scrapes the listing page given in <c>textBox1</c> and copies the title,
    /// player URL and duration of every episode found to the clipboard.
    /// </summary>
    /// <param name="sender">The control that raised the event.</param>
    /// <param name="e">Event data (unused).</param>
    private void button1_Click(object sender, EventArgs e)
    {
        // Select the pattern pair locally. Overwriting the fields (as the
        // previous code did) made the primary patterns unreachable for every
        // later click once the box had been unchecked a single time.
        bool usePrimary = this.checkBox1.Checked;
        string linkPattern = usePrimary ? urlpattern : urlpattern1;
        string durationPattern = usePrimary ? timepattern : timepattern1;

        string html = Core.Html.GetHtml(this.textBox1.Text);

        List<string> urls = CollectDistinct(html, linkPattern);

        // NOTE(review): durations are de-duplicated by value, so two episodes
        // with the same running time collapse into one entry and shift the
        // pairing below - confirm against real page markup before changing.
        List<string> urltime = CollectDistinct(html, durationPattern);

        if (urls.Count != urltime.Count)
        {
            // Best effort: warn the user, then carry on with what was found.
            MessageBox.Show("时间和URL居然不对应,是否有错?");
        }

        StringBuilder sb = new StringBuilder();

        for (int i = 0; i < urls.Count; i++)
        {
            string h = Core.Html.GetHtml(urls[i]);

            string vid = Core.RegHelper.MatchToString(h, vidpattern, 1, 0);
            string albumId = Core.RegHelper.MatchToString(h, albumIdpattern, 1);
            string title = Core.RegHelper.MatchToString(h, titlepattern, 1);
            string w = Core.RegHelper.MatchToString(h, wpattern, 1);

            string url = string.Format(format, vid, w, albumId);

            // Emit the title and player URL together with the duration; without
            // them the per-episode download above produces nothing.
            sb.AppendLine(title);
            sb.AppendLine(url);

            // Fewer durations than links must not abort the export with an
            // ArgumentOutOfRangeException; such entries get an empty duration.
            sb.AppendLine(i < urltime.Count ? urltime[i] : string.Empty);

            sb.AppendLine("\r\n\r\n");
        }

        Clipboard.SetDataObject(sb.ToString());

        MessageBox.Show("已复制到剪贴板!");
    }

    /// <summary>
    /// Returns the distinct, trimmed values of capture group 1 for every match
    /// of <paramref name="pattern"/> in <paramref name="html"/>, in order of
    /// first appearance.
    /// </summary>
    /// <param name="html">Text to search.</param>
    /// <param name="pattern">Regular expression with at least one capture group.</param>
    /// <returns>The distinct captured values.</returns>
    private static List<string> CollectDistinct(string html, string pattern)
    {
        List<string> values = new List<string>();

        MatchCollection matches = Core.RegHelper.MatchToArray(html, pattern, System.Text.RegularExpressions.RegexOptions.None);

        foreach (Match item in matches)
        {
            string value = item.Groups[1].Value.Trim();

            if (!values.Contains(value))
            {
                values.Add(value);
            }
        }

        return values;
    }
}

版权说明:
本网站凡注明“广州京杭 原创”的皆为本站原创文章,如需转载请注明出处!
本网转载皆注明出处,遵循行业规范,如发现作品内容版权或其它问题的,请与我们联系处理!
欢迎扫描右侧微信二维码与我们联系。