mirror of
https://github.com/PredatH0r/ChanSort.git
synced 2026-02-20 05:16:45 +01:00
decoding of Panasonic channel names with auto-detection of code page and support for mixed-in UTF-8 sequences
This commit is contained in:
@@ -52,6 +52,8 @@ namespace ChanSort.Api
|
||||
this.FavIndex = new List<int>(MAX_FAV_LISTS);
|
||||
for (int i = 0; i < MAX_FAV_LISTS; i++)
|
||||
this.FavIndex.Add(-1);
|
||||
this.Name = "";
|
||||
this.ShortName = "";
|
||||
}
|
||||
|
||||
/// <summary>
|
||||
|
||||
@@ -1,4 +1,5 @@
|
||||
using System.Collections.Generic;
|
||||
using System;
|
||||
using System.Collections.Generic;
|
||||
using System.Data.SQLite;
|
||||
using System.Text;
|
||||
using ChanSort.Api;
|
||||
@@ -8,9 +9,10 @@ namespace ChanSort.Loader.Panasonic
|
||||
internal class DbChannel : ChannelInfo
|
||||
{
|
||||
internal int Bits;
|
||||
internal byte[] RawName;
|
||||
|
||||
#region ctor()
|
||||
internal DbChannel(SQLiteDataReader r, IDictionary<string, int> field, DataRoot dataRoot)
|
||||
internal DbChannel(SQLiteDataReader r, IDictionary<string, int> field, DataRoot dataRoot, Encoding encoding)
|
||||
{
|
||||
this.RecordIndex = r.GetInt32(field["rowid"]);
|
||||
this.RecordOrder = r.GetInt32(field["major_channel"]);
|
||||
@@ -39,6 +41,7 @@ namespace ChanSort.Loader.Panasonic
|
||||
this.Encrypted = r.GetInt32(field["free_CA_mode"]) != 0;
|
||||
this.Lock = r.GetInt32(field["child_lock"]) != 0;
|
||||
this.ParseFavorites(r, field);
|
||||
this.ReadNamesWithEncodingDetection(r, field, encoding);
|
||||
|
||||
if (ntype == 10 || ntype == 14)
|
||||
this.ReadAnalogData(r, field);
|
||||
@@ -63,21 +66,17 @@ namespace ChanSort.Loader.Panasonic
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region ReadAnalogData()
|
||||
private void ReadAnalogData(SQLiteDataReader r, IDictionary<string, int> field)
|
||||
{
|
||||
this.Name = r.GetString(field["sname"]);
|
||||
this.FreqInMhz = r.IsDBNull(field["freq"]) ? 0 : (decimal)r.GetInt32(field["freq"]) / 1000;
|
||||
this.ChannelOrTransponder = Tools.GetAnalogChannelNumber((int)this.FreqInMhz);
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region ReadDvbData()
|
||||
protected void ReadDvbData(SQLiteDataReader r, IDictionary<string, int> field, DataRoot dataRoot, byte[] delivery)
|
||||
{
|
||||
string longName, shortName;
|
||||
this.GetChannelNames(r.GetString(field["sname"]), out longName, out shortName);
|
||||
this.Name = longName;
|
||||
this.ShortName = shortName;
|
||||
|
||||
int stype = r.GetInt32(field["stype"]);
|
||||
this.SignalSource |= LookupData.Instance.IsRadioOrTv(stype);
|
||||
this.ServiceType = stype;
|
||||
@@ -115,30 +114,113 @@ namespace ChanSort.Loader.Panasonic
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region ReadNamesWithEncodingDetection()
|
||||
/// <summary>
|
||||
/// Character encoding is a mess here. Code pages mixed with UTF-8 and raw data
|
||||
/// </summary>
|
||||
private void ReadNamesWithEncodingDetection(SQLiteDataReader r, IDictionary<string, int> field, Encoding encoding)
|
||||
{
|
||||
byte[] buffer = new byte[100];
|
||||
int len = (int)r.GetBytes(field["sname"], 0, buffer, 0, buffer.Length);
|
||||
int end = Array.IndexOf<byte>(buffer, 0, 0, len);
|
||||
if (end >= 0)
|
||||
len = end;
|
||||
this.RawName = new byte[len];
|
||||
Array.Copy(buffer, 0, this.RawName, 0, len);
|
||||
this.ChangeEncoding(encoding);
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region ChangeEncoding()
|
||||
public override void ChangeEncoding(Encoding encoding)
|
||||
{
|
||||
// the encoding of channel names is a complete mess:
|
||||
// it can be UTF-8
|
||||
// it can be as specified by the DVB-encoding with a valid code page selector byte
|
||||
// it can have a DVB-encoded code page selector, but ignores the CP and use UTF-8 regardless
|
||||
// it can be code page encoded without any clue to what the code page is
|
||||
// it can have DVB-control characters inside an UTF-8 stream
|
||||
|
||||
if (RawName.Length == 0)
|
||||
return;
|
||||
|
||||
int startOffset;
|
||||
int bytesPerChar;
|
||||
if (!GetRecommendedEncoding(ref encoding, out startOffset, out bytesPerChar))
|
||||
return;
|
||||
|
||||
// single byte code pages might have UTF-8 code mixed in, so we have to parse it manually
|
||||
StringBuilder sb = new StringBuilder();
|
||||
for (int i = startOffset; i < this.RawName.Length; i+=bytesPerChar)
|
||||
{
|
||||
byte c = this.RawName[i];
|
||||
byte c2 = i + 1 < this.RawName.Length ? this.RawName[i + 1] : (byte)0;
|
||||
if (c < 0xA0)
|
||||
sb.Append((char)c);
|
||||
else if (bytesPerChar == 1 && c >= 0xC0 && c <= 0xDF && c2 >= 0x80 && c2 <= 0xBF) // 2 byte UTF-8
|
||||
{
|
||||
sb.Append((char)(((c & 0x1F) << 6) | (c2 & 0x3F)));
|
||||
++i;
|
||||
}
|
||||
else
|
||||
sb.Append(encoding.GetString(this.RawName, i, bytesPerChar));
|
||||
}
|
||||
|
||||
string longName, shortName;
|
||||
this.GetChannelNames(sb.ToString(), out longName, out shortName);
|
||||
this.Name = longName;
|
||||
this.ShortName = shortName;
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region GetRecommendedEncoding()
|
||||
private bool GetRecommendedEncoding(ref Encoding encoding, out int startOffset, out int bytesPerChar)
|
||||
{
|
||||
startOffset = 0;
|
||||
bytesPerChar = 1;
|
||||
if (RawName[0] < 0x10) // single byte character sets
|
||||
{
|
||||
encoding = DvbStringDecoder.GetEncoding(RawName[0]);
|
||||
startOffset = 1;
|
||||
}
|
||||
else if (RawName[0] == 0x10) // prefix for 16 bit code page ID with single byte character sets
|
||||
{
|
||||
if (RawName.Length < 3) return false;
|
||||
encoding = DvbStringDecoder.GetEncoding(0x100000 + RawName[1]*256 + RawName[2]);
|
||||
startOffset = 3;
|
||||
}
|
||||
else if (RawName[0] == 0x15) // UTF-8
|
||||
{
|
||||
encoding = Encoding.UTF8;
|
||||
startOffset = 1;
|
||||
}
|
||||
else if (RawName[0] < 0x20) // various 2-byte character sets
|
||||
{
|
||||
encoding = DvbStringDecoder.GetEncoding(RawName[0]);
|
||||
startOffset = 1;
|
||||
bytesPerChar = 2;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
#endregion
|
||||
|
||||
#region GetChannelNames()
|
||||
private void GetChannelNames(string name, out string longName, out string shortName)
|
||||
{
|
||||
StringBuilder sbLong = new StringBuilder();
|
||||
StringBuilder sbShort = new StringBuilder();
|
||||
|
||||
#if false
|
||||
//Encoding encoding = Encoding.Default;
|
||||
if (name.Length > 0 && name[0] < 0x20)
|
||||
{
|
||||
if (name.Length >= 3 && name[0] == 0x10)
|
||||
encoding = DvbStringDecoder.GetEncoding(name[0]);
|
||||
}
|
||||
#endif
|
||||
bool inShort = false;
|
||||
foreach (char c in name)
|
||||
{
|
||||
if (c < 0x20)
|
||||
continue;
|
||||
if (c == 0x86)
|
||||
if (c == 0x86 || c == '\uE086')
|
||||
inShort = true;
|
||||
else if (c == 0x87)
|
||||
else if (c == 0x87 || c == '\uE087')
|
||||
inShort = false;
|
||||
if (c >= 0x80 && c <= 0x9F)
|
||||
if (c >= 0x80 && c <= 0x9F || c>='\uE080' && c<='\uE09F')
|
||||
continue;
|
||||
|
||||
if (inShort)
|
||||
@@ -151,11 +233,13 @@ namespace ChanSort.Loader.Panasonic
|
||||
}
|
||||
#endregion
|
||||
|
||||
|
||||
#region UpdateRawData()
|
||||
public override void UpdateRawData()
|
||||
{
|
||||
|
||||
|
||||
}
|
||||
#endregion
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
@@ -498,7 +498,7 @@ namespace ChanSort.Loader.Panasonic
|
||||
"profile1index","profile2index","profile3index","profile4index","stype", "onid", "tsid", "sid", "ntype", "ya_svcid", "delivery" };
|
||||
|
||||
const string sql = @"
|
||||
select s.rowid,s.major_channel,s.physical_ch,s.sname,t.freq,s.skip,s.running_status,s.free_CA_mode,s.child_lock,
|
||||
select s.rowid,s.major_channel,s.physical_ch,cast(s.sname as blob),t.freq,s.skip,s.running_status,s.free_CA_mode,s.child_lock,
|
||||
profile1index,profile2index,profile3index,profile4index,s.stype,s.onid,s.tsid,s.svcid,s.ntype,s.ya_svcid,delivery
|
||||
from SVL s
|
||||
left outer join TSL t on s.ntype=t.ntype and s.physical_ch=t.physical_ch and s.tsid=t.tsid
|
||||
@@ -512,7 +512,7 @@ order by s.ntype,major_channel
|
||||
{
|
||||
while (r.Read())
|
||||
{
|
||||
ChannelInfo channel = new DbChannel(r, fields, this.DataRoot);
|
||||
ChannelInfo channel = new DbChannel(r, fields, this.DataRoot, this.DefaultEncoding);
|
||||
if (!channel.IsDeleted)
|
||||
{
|
||||
var channelList = this.DataRoot.GetChannelList(channel.SignalSource);
|
||||
@@ -534,6 +534,21 @@ order by s.ntype,major_channel
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region DefaultEncoding
|
||||
public override Encoding DefaultEncoding
|
||||
{
|
||||
get { return base.DefaultEncoding; }
|
||||
set
|
||||
{
|
||||
base.DefaultEncoding = value;
|
||||
foreach (var list in this.DataRoot.ChannelLists)
|
||||
{
|
||||
foreach(var channel in list.Channels)
|
||||
channel.ChangeEncoding(value);
|
||||
}
|
||||
}
|
||||
}
|
||||
#endregion
|
||||
|
||||
|
||||
#region Save()
|
||||
@@ -579,7 +594,7 @@ order by s.ntype,major_channel
|
||||
cmd.Parameters.Add(new SQLiteParameter("@lock", DbType.Int32));
|
||||
cmd.Parameters.Add(new SQLiteParameter("@skip", DbType.Int32));
|
||||
cmd.Prepare();
|
||||
foreach (ChannelInfo channel in channelList.Channels)
|
||||
foreach (DbChannel channel in channelList.Channels)
|
||||
{
|
||||
if (channel.NewProgramNr < 0 || channel.OldProgramNr < 0)
|
||||
continue;
|
||||
@@ -588,7 +603,7 @@ order by s.ntype,major_channel
|
||||
cmd.Parameters["@progNr"].Value = channel.NewProgramNr;
|
||||
for (int fav = 0; fav < 4; fav++)
|
||||
cmd.Parameters["@fav" + (fav + 1)].Value = Math.Max(0, channel.FavIndex[fav]);
|
||||
cmd.Parameters["@name"].Value = channel.Name;
|
||||
cmd.Parameters["@name"].Value = channel.RawName;
|
||||
cmd.Parameters["@lock"].Value = channel.Lock;
|
||||
cmd.Parameters["@skip"].Value = channel.Skip;
|
||||
cmd.ExecuteNonQuery();
|
||||
@@ -654,6 +669,7 @@ order by s.ntype,major_channel
|
||||
}
|
||||
#endregion
|
||||
|
||||
#region GetFileInformation()
|
||||
public override string GetFileInformation()
|
||||
{
|
||||
StringBuilder sb = new StringBuilder();
|
||||
@@ -673,5 +689,6 @@ order by s.ntype,major_channel
|
||||
sb.Append("Character encoding: ").AppendLine(this.charEncoding);
|
||||
return sb.ToString();
|
||||
}
|
||||
#endregion
|
||||
}
|
||||
}
|
||||
|
||||
@@ -25,9 +25,9 @@ namespace ChanSort.Ui
|
||||
{
|
||||
public partial class MainForm : XtraForm
|
||||
{
|
||||
public const string AppVersion = "v2013-11-16";
|
||||
public const string AppVersion = "v2013-11-20";
|
||||
|
||||
private const int MaxMruEntries = 5;
|
||||
private const int MaxMruEntries = 8;
|
||||
|
||||
#region enum EditMode
|
||||
private enum EditMode
|
||||
|
||||
24
readme.txt
24
readme.txt
@@ -1,20 +1,9 @@
|
||||
Version v2013-11-16 =======================================================
|
||||
Version v2013-11-20 =======================================================
|
||||
|
||||
Changes:
|
||||
- Loading a .csv reference list now also changes the channel names. This
|
||||
way analog channel names can be restored after a new channel scan
|
||||
- FIX: changes to Samsung channel lists after the first "save file"
|
||||
operation were lost. Only the first save operation worked as expected.
|
||||
- FIX: dragging something (e.g. a file) from outside ChanSort over one of
|
||||
its tables causes an error
|
||||
- FIX: channels in Samsung B-series DVB-C/T channel lists were incorrectly
|
||||
identified and marked as deleted/active, resulting in duplicate program
|
||||
numbers on the TV.
|
||||
- FIX: channel names in Samsung lists sometimes showed "..." after the end
|
||||
- Experimental support for modifying LG channel lists with predefined
|
||||
channel numbers (LCN)
|
||||
- Backed-out some changes from 2013-11-09 which may have caused incorrect
|
||||
handling of deleted channels in Samsung channel lists
|
||||
- Panasonic: Handling of special characters in channel names
|
||||
- Toshiba: channels didn't change their order for zapping in .zip/chmgt.db
|
||||
channel lists (thanks to Kurt W. for the hint)
|
||||
|
||||
The complete change log can be found at the end of this document
|
||||
|
||||
@@ -123,6 +112,11 @@ OTHER DEALINGS IN THE SOFTWARE.
|
||||
|
||||
Change log ================================================================
|
||||
|
||||
2013-11-20
|
||||
- Panasonic: Handling of special characters in channel names
|
||||
- Toshiba: channels didn't change their order for zapping in .zip/chmgt.db
|
||||
channel lists (thanks to Kurt W. for the hint)
|
||||
|
||||
2013-11-16
|
||||
- FIX: changes to Samsung channel lists after the first "save file"
|
||||
operation were lost. Only the first save operation worked as expected.
|
||||
|
||||
Reference in New Issue
Block a user