C#逐行解析文本数据

问题描述

| 我的项目有问题,在这里让我解释一下,在这里我需要一些专家指导,因为我是编程新手。 我在记事本中有这样的数据:
10192 20351 30473 40499 50449 60234    
10192 20207 30206 40203 50205 60226    
10192 20252 30312 40376 50334 60252
它是26行数据,但是我仅显示3行。以下是按优先级排序的一些规则: -我只想阅读文本文件,然后提取数字。示例:10192 20351等。 -我有6列ListView,我想在它的列中显示每一行数字   第1栏|第2栏|第3列|第4列|第5栏|第6栏
10192   | 20351   | 30473  | 40499  |50449  | 60234
当然,如果可能的话,每5位数的前2位数是一个唯一的代码,我只希望最后3位数。例如:192 351 473 499 499234。因此每个数字将修改为10.000。 我想我让很多人感到困惑,对不起,这是我当前的代码 私人委托void UpdateUiTextDelegate(String Text);         私有无效serial_DataRecieved(对象发送者,System.IO.Ports.SerialDataReceivedEventArgs e)         {             //将收到的字符收集到我们的\'buffer \'(字符串)中。             字符串接收到的数据;             receive_data = serial.ReadExisting();             dispatcher.Invoke(dispatcherPriority.Send,新的UpdateUiTextDelegate(WriteData),received_data);         }
    private void WriteData(String Text)
    {
        if (bufferData != \"\" || Text[0] == \'1\')
            bufferData += Text;
        if (bufferData.Length >= 35)
        {
            using (System.IO.StreamWriter file = new System.IO.StreamWriter(@\"C:\\Users\\Rads\\Desktop\\Training06.txt\",true))
            {
                file.WriteLine(bufferData);
            }
            listBox1.Items.Add(bufferData);
            bufferData = \"\";
        }
    }
    #endregion

    private void Window_Loaded(object sender,RoutedEventArgs e)
    {

    }

    //browse .txt file
    private void browse_btn_Click(object sender,RoutedEventArgs e)
    {
        Microsoft.Win32.OpenFileDialog dlg = new Microsoft.Win32.OpenFileDialog();

        dlg.DefaultExt = \".txt\";
        dlg.Filter = \"Text document (.txt)|*.txt\";

        Nullable<bool> result = dlg.ShowDialog();

        if (result == true)
        {
            string filename = dlg.FileName;
            textBox.Text = filename;
        }
    }

    private void Parsing_String(string filename)
    {
        List<Row> list = new List<Row>();

        foreach (String str in File.ReadLines(filename))
        {
            String[] strCols = str.Split(Convert.tochar(\" \"));
            list.Add(new Row()
            {
                Column1 = strCols[0].Substring(2),Column2 = strCols[1].Substring(2),Column3 = strCols[2].Substring(2),Column4 = strCols[3].Substring(2),Column5 = strCols[4].Substring(2),Column6 = strCols[5].Substring(2),});
        }

        dg.ItemsSource = list;
    }

    public class Row
    {
        public string Column1 { get; set; }
        public string Column2 { get; set; }
        public string Column3 { get; set; }
        public string Column4 { get; set; }
        public string Column5 { get; set; }
        public string Column6 { get; set; }

    }
XAML代码
<Window x:Class=\"SamplingData.MainWindow\"
    xmlns=\"http://schemas.microsoft.com/winfx/2006/xaml/presentation\"
    xmlns:x=\"http://schemas.microsoft.com/winfx/2006/xaml\"
    Title=\"MainWindow\" Height=\"368\" Width=\"401\" Loaded=\"Window_Loaded\">

<TabControl Height=\"332\" HorizontalAlignment=\"Left\" Name=\"tabControl1\" VerticalAlignment=\"Top\" Width=\"380\">
    <TabItem Header=\"Sampling\" Name=\"Sampling\">
        <Grid>
            <Label Content=\"DATA RECEIVED\" Height=\"28\" HorizontalAlignment=\"Left\" Margin=\"6,6,0\" Name=\"label1\" VerticalAlignment=\"Top\" />
            <Button Content=\"Connect\" Height=\"23\" HorizontalAlignment=\"Left\" Margin=\"264,0\" Name=\"ConnectButton\" VerticalAlignment=\"Top\" Width=\"75\" Click=\"Connect_Comms\" />
            <ListBox Height=\"222\" HorizontalAlignment=\"Left\" Margin=\"10,37,0\" Name=\"listBox1\" VerticalAlignment=\"Top\" Width=\"329\" />
        </Grid>
    </TabItem>
    <TabItem Header=\"Training\" Name=\"tabItem1\">
        <Grid>
            <Button Content=\"Training\" Height=\"23\" HorizontalAlignment=\"Left\" Margin=\"243,28,0\" Name=\"Train_Btn\" VerticalAlignment=\"Top\" Width=\"75\" />
            <Button Content=\"browse\" Height=\"23\" HorizontalAlignment=\"Left\" Margin=\"243,0\" Name=\"browse_btn\" VerticalAlignment=\"Top\" Width=\"75\" Click=\"browse_btn_Click\" />
            <TextBox Height=\"23\" HorizontalAlignment=\"Left\" Margin=\"6,7,0\" Name=\"textBox\" VerticalAlignment=\"Top\" Width=\"231\" Background=\"{x:Null}\"></TextBox>
            <RadioButton Content=\"RadioButton\" Height=\"16\" HorizontalAlignment=\"Left\" Margin=\"507,76,0\" Name=\"radioButton1\" VerticalAlignment=\"Top\" />
            <DataGrid x:Name=\"dg\" AutoGenerateColumns=\"False\" Margin=\"0,57,0\" DataContext=\"{Binding}\">
                <DataGrid.Columns>
                    <DataGridTextColumn Binding=\"{Binding Column1}\" Header=\"Column 1\"></DataGridTextColumn>
                    <DataGridTextColumn Binding=\"{Binding Column2}\" Header=\"Column 2\"></DataGridTextColumn>
                    <DataGridTextColumn Binding=\"{Binding Column3}\" Header=\"Column 3\"></DataGridTextColumn>
                    <DataGridTextColumn Binding=\"{Binding Column4}\" Header=\"Column 4\"></DataGridTextColumn>
                    <DataGridTextColumn Binding=\"{Binding Column5}\" Header=\"Column 5\"></DataGridTextColumn>
                    <DataGridTextColumn Binding=\"{Binding Column6}\" Header=\"Column 6\"></DataGridTextColumn>
                </DataGrid.Columns>
            </DataGrid>
        </Grid>
    </TabItem>
</TabControl>
非常感谢有人可以帮助我。     

解决方法

编辑:按照Ash的建议添加了Row变量: 假设您没有指定要向哪个对象写入数据,我假设它是一个名为Row的数据行:
private void Parsing_String(string filename)    
{
    DataTable dt = CreateDataTable();
    foreach (String str in File.ReadLines(filename))
    {
      String[] strCols = str.Split(Convert.ToChar(\" \"));
      DataRow Row = dt.NewRow(); //Where dt is a DataTable
      for (int i =0; i < strCols.length; i++)
      {
           Row[i] = strCols[i].Substring(2); //This will start reading from the third character
      }
      dt.Rows.Add(Row);
     }
      listView1.ItemsSource = dt.Rows;
}

//**EDIT**: Just in case you don\'t have a datatable and you want to create a small one:

public DataTable CreateDataTable()
    {
        DataTable dt = new DataTable();

        new string[] { \"Column 1\",\"Column 2\",\"Column 3\",\"Column 4\",\"Column 5\",\"Column 6\" }
            .ToList()
            .ForEach(c => { dt.Columns.Add(new DataColumn(c)); });
        return dt;
    }
编辑:最后尝试(忽略上面的代码):
    private void Parsing_String(string filename)
    {
        List<Row> list = new List<Row>();

        foreach (String str in File.ReadLines(filename))
        {
            String[] strCols = str.Split(Convert.ToChar(\" \"));
            list.Add(new Row() 
            {
                Column1 = strCols[0].Substring(2),Column2 = strCols[1].Substring(2),Column3 = strCols[2].Substring(2),Column4 = strCols[3].Substring(2),Column5 = strCols[4].Substring(2),Column6 = strCols[5].Substring(2)
            });
        }

        dg.ItemsSource = list;
    }

    public class Row
    {
        public string Column1 { get; set; }
        public string Column2 { get; set; }
        public string Column3 { get; set; }
        public string Column4 { get; set; }
        public string Column5 { get; set; }
        public string Column6 { get; set; }
    }
然后在您的xaml中:      如果要指定自定义标头,则必须对其进行更改,以便它不会自动生成列,而是使用绑定,即:
   <DataGrid x:Name=\"dg\" AutoGenerateColumns=\"False\">
        <DataGrid.Columns>
            <DataGridTextColumn Binding=\"{Binding Column1}\" Header=\"Column 1\"></DataGridTextColumn>
            <DataGridTextColumn Binding=\"{Binding Column2}\" Header=\"Column 2\"></DataGridTextColumn>
            <DataGridTextColumn Binding=\"{Binding Column3}\" Header=\"Column 3\"></DataGridTextColumn>
            <DataGridTextColumn Binding=\"{Binding Column4}\" Header=\"Column 4\"></DataGridTextColumn>
            <DataGridTextColumn Binding=\"{Binding Column5}\" Header=\"Column 5\"></DataGridTextColumn>
            <DataGridTextColumn Binding=\"{Binding Column6}\" Header=\"Column 6\"></DataGridTextColumn>
        </DataGrid.Columns>
    </DataGrid>
编辑这将计算第一列总计
protected int CalculateFirstColumnTotal(List<Row> list)
{
    int total = 0;
    foreach (Row row in list)
      total += int.Parse(row.Column1);
}
编辑: 您实际上从未调用过Parsing_String方法,将以下行添加到browser方法:
private void Browse_btn_Click(object sender,RoutedEventArgs e)    
{
    //Existing Code
    Parsing_String(textBox.Text);  //Add this line to the last line of the method.
}
    ,我认为您根本不需要Regex。您只需要string.Line按行和空格分隔。
string[] lines = data.Split(Enviroment.NewLine);
对于每一行,可以通过按行将行分开来获取字段。
string[] fields = line.Split(\' \');
    ,大概是这样的:
var result = from row in theFileAsString.Split(\'\\n\')
             select new {
                Columns = row.Split(\' \').Select(s => s.Substring(2))
             }
在那里,您将拥有一个
IEnumerable
,其中每个项目的属性
Columns
都包含带有数据的字符串。 虽然未经测试,但您知道了。     ,好的,这可能是矫kill过正,但是您提到要将数据放入列表视图(也许是数据网格?),在这种情况下,您可能希望将数据转换为某种对象形式。实际上,这取决于获得数据后实际要处理的数据。 假设您一旦掌握了数据,便会想要对其进行操作或进行其他操作,然后尝试类似的操作-您应该能够将其直接放入新的控制台应用程序中并运行它。
namespace ConsoleApplication6
{
    using System;
    using System.Collections.Generic;
    using System.IO;
    using System.Text.RegularExpressions;

    class Program
    {
        static void Main(string[] args)
        {
            string filename = @\"c:\\test.txt\";

            // Because you\'re working with a small file,we\'ll just read all the lines into memory
            List<LineData> processedLines = new List<LineData>();
            foreach (var line in File.ReadAllLines(filename))
            {
                processedLines.Add(new LineData(line));
            }

            // Write out the line data to the console to prove that it has been read
            foreach (var processedLine in processedLines)
            {
                Console.WriteLine(
                    \"{0},{1},{2},{3},{4},{5}\",processedLine.Column1,processedLine.Column2,processedLine.Column3,processedLine.Column4,processedLine.Column5,processedLine.Column6);
            }
        }
    }

    public class LineData
    {
        public LineData(string line)
        {
            // Regex basically means find two digits (\"Prefix\") followed by 3 digits (\"Value\")
            Regex regex = new Regex(@\"(?<Prefix>\\d{2})(?<Value>\\d{3})\");
            var lineMatches = regex.Matches(line);
            if (lineMatches.Count != 6)
            {
                // You should really be throwing your own exception type...
                throw new Exception(\"Expected 6 columns!\");
            }

            this.Column1 = this.ExtractMatchData(lineMatches[0]);
            this.Column2 = this.ExtractMatchData(lineMatches[1]);
            this.Column3 = this.ExtractMatchData(lineMatches[2]);
            this.Column4 = this.ExtractMatchData(lineMatches[3]);
            this.Column5 = this.ExtractMatchData(lineMatches[4]);
            this.Column6 = this.ExtractMatchData(lineMatches[5]);
        }

        private string ExtractMatchData(Match match)
        {
            return match.Groups[\"Value\"].Value;
        }

        public string Column1 { get; set; }
        public string Column2 { get; set; }
        public string Column3 { get; set; }
        public string Column4 { get; set; }
        public string Column5 { get; set; }
        public string Column6 { get; set; }
    }
}
    ,
using (var stream = File.Open(this.filename,FileMode.Open,FileAccess.Read)
{
    var reader = new StreamReader(stream);
    var data = reader.ReadLine();
    while (!String.IsNullOrWhitespace(data))
    {
        string[] columns = data.Split(\' \');
        Console.WriteLine(string.Format(\"{0} {1} {2} {3} {4} {5}\",columns[0],columns[1],));
        data = reader.ReadLine();
    }
}
    ,您不必为此使用正则表达式。
var data = @\"10192 20351 30473 40499 50449 60234
10192 20207 30206 40203 50205 60226
10192 20252 30312 40376 50334 60252\";

var result = from line in data.Split(new[] { \"\\r\\n\",\"\\n\" },StringSplitOptions.RemoveEmptyEntries)
             let splitted = line.Split(new[] {\' \'},StringSplitOptions.RemoveEmptyEntries)
             select splitted.Select(s => s.Substring(2));
或文件
using System.IO; // In the top

var result = from line in File.ReadLines(\"path\")
             let splitted = line.Split(new[] {\' \'},StringSplitOptions.RemoveEmptyEntries)
             select splitted.Select(s => s.Substring(2));
result
现在将包含一个字符串序列序列(其中前两个字符已删除)。该版本适用于Unix和Windows换行符。并且它还删除了可能导致其他答案失败的其他空格。