You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
82 lines
3.4 KiB
82 lines
3.4 KiB
using System;
|
|
using System.Collections.Generic;
|
|
using System.Linq;
|
|
using System.Text;
|
|
using System.Text.RegularExpressions;
|
|
using System.Net;
|
|
using System.Web;
|
|
using System.IO;
|
|
|
|
namespace FLocal.Importer {
|
|
public class ShallerGateway {
|
|
|
|
public static string getUserInfoAsString(string userName) {
|
|
//if(userName != HttpUtility.UrlEncode(userName, ShallerConnector.encoding)) throw new ApplicationException("'" + userName + "':showprofile.php?User=" + HttpUtility.UrlEncode(userName, ShallerConnector.encoding) + "&What=login&showlite=l");
|
|
return ShallerConnector.getPageContent("showprofile.php?User=" + HttpUtility.UrlEncode(userName, ShallerConnector.encoding) + "&What=login&showlite=l", new Dictionary<string,string>(), new System.Net.CookieContainer());
|
|
}
|
|
|
|
private static Dictionary<string, Regex> regexInfoCache = new Dictionary<string, Regex>();
|
|
private static Regex getInfoRegexByCaption(string caption) {
|
|
if(!regexInfoCache.ContainsKey(caption)) {
|
|
lock(caption) {
|
|
if(!regexInfoCache.ContainsKey(caption)) {
|
|
regexInfoCache[caption] = new Regex("<td[^>]*>\\s*" + caption + "\\s*</td>\\s*<td>\\s*([^<>]*)\\s*</td>", RegexOptions.Compiled | RegexOptions.IgnoreCase | RegexOptions.Multiline);
|
|
}
|
|
}
|
|
}
|
|
return regexInfoCache[caption];
|
|
}
|
|
|
|
private static Regex avatarRegex = new Regex("<img\\s+src=\"/user/(\\d+\\.\\w+)\"\\s+alt=\"Picture\"\\s+width=\"\\d+\"\\s+height=\"\\d+\"\\s*/>", RegexOptions.Compiled | RegexOptions.IgnoreCase | RegexOptions.Multiline);
|
|
|
|
private static Dictionary<string, string> userImportStructure {
|
|
get {
|
|
return new Dictionary<string,string>() {
|
|
{ "regDate", "Дата\\s+регистрации" },
|
|
{ "signature", "Подпись" },
|
|
{ "title", "Титул" },
|
|
{ "location", "Расположение" },
|
|
{ "biography", "Биография" },
|
|
};
|
|
}
|
|
}
|
|
|
|
public static Dictionary<string, string> getUserInfo(string userName) {
|
|
string content = getUserInfoAsString(userName);
|
|
Dictionary<string, string> result = userImportStructure.ToDictionary<KeyValuePair<string, string>, string, string>(
|
|
kvp => kvp.Key,
|
|
kvp => HttpUtility.HtmlDecode(getInfoRegexByCaption(kvp.Value).Match(content).Groups[1].Value).Trim()
|
|
);
|
|
result["avatar"] = avatarRegex.Match(content).Groups[1].Value;
|
|
return result;
|
|
}
|
|
|
|
public static IEnumerable<string> getUserNames(int pageNum) {
|
|
string content = ShallerConnector.getPageContent("showmembers.php?Cat=&sb=13&page=" + pageNum + "&showlite=l", new Dictionary<string,string>(), new System.Net.CookieContainer());
|
|
Regex matcher = new Regex(";User=([^&]+)&", RegexOptions.Compiled | RegexOptions.Multiline | RegexOptions.IgnoreCase);
|
|
MatchCollection matches = matcher.Matches(content);
|
|
HashSet<string> result = new HashSet<string>();
|
|
foreach(Match match in matches) {
|
|
result.Add(HttpUtility.UrlDecode(match.Groups[1].Value, ShallerConnector.encoding).Trim());
|
|
}
|
|
return result;
|
|
}
|
|
|
|
private static FileInfo getFileInfo(string path, int attempt) {
|
|
try {
|
|
return ShallerConnector.getPageInfo(path, new Dictionary<string,string>(), new CookieContainer());
|
|
} catch(Exception) {
|
|
if(attempt > 3) {
|
|
throw;
|
|
} else {
|
|
return getFileInfo(path, attempt + 1);
|
|
}
|
|
}
|
|
}
|
|
|
|
public static FileInfo getFileInfo(string path) {
|
|
return getFileInfo(path, 1);
|
|
}
|
|
|
|
}
|
|
}
|
|
|