How do I detect merged columns and rows in a Word table?

I need to read all the text from a table. Using the code below I can read the content of the table. I have uploaded a dummy .docx file that contains the tables here: https://1drv.ms/w/s!Ah-Jh2Ok5SuHel9ZpB-V5DZ66DM

// Walk the table row by row and cell by cell; tb is the Word table being read
// (it is declared outside this snippet).
foreach (Word.Row row in tb.Rows)
{
    foreach (Word.Cell cell in row.Cells)
    {
        string cellText = "";
        if (cell.Range != null)
        {
            // Take the cell's text, trim it and remove the "\r\a" sequence from it.
            cellText = cell.Range.Text.ToString().Trim().Replace("\r\a", "");
        }
        // cellText is assigned but not used any further within this snippet.
    }
} 

      

But I am facing problems in the following three cases.

  • Case 1: shown in Table 1, two column cells have been merged. Using the above code I can read all the values, but this row has one fewer iteration than the other rows. How can I tell whether this row contains merged cell(s)?
  • Case 2: shown in Table 2, two rows have been merged. While iterating over tb.Rows I get the error "Cannot access individual rows in this collection because the table has vertically merged cells." How can I tell whether the table contains merged rows or not?
  • Case 3: shown in Table 3, a table is nested inside another table. The above code identifies only one table, and after the line cellText = cell.Range.Text.ToString().Trim().Replace("\r\a", ""); has executed, cellText contains all the values of the current cell plus the values of the inner table, i.e. 2abcd. How can I iterate over the inner tables?
0


source to share


1 answer


You can determine whether cells are merged by looking at the table's XML. The example I put together parses the table XML and then finds the corresponding interop cells. Everything is put into a two-dimensional array, which is then printed.

Hope this is a good start.



using System;
using System.Linq;
using System.Xml.Linq;
using Word = NetOffice.WordApi;

namespace TableTest
{
    class Program
    {
        /// <summary>
        /// Console entry point: attaches to the active Word instance, prints a banner
        /// with the active document's name and then lists the cell information of
        /// every table in <c>document.Tables</c>. Any exception is written to the
        /// console; the program then waits for Enter before exiting.
        /// </summary>
        /// <param name="args">Command-line arguments (not used).</param>
        static void Main(string[] args)
        {
            try
            {
                using (var word = Word.Application.GetActiveInstance())
                {
                    var activeDocument = word.ActiveDocument;

                    // Banner: the title framed by two rules of '*' of the same width.
                    var banner = $"* Tables in {activeDocument.Name} *";
                    var bannerRule = new string('*', banner.Length);
                    Console.WriteLine(bannerRule);
                    Console.WriteLine(banner);
                    Console.WriteLine(bannerRule);
                    Console.WriteLine();

                    // The Tables collection is addressed with one-based indexes.
                    var number = 1;
                    while (number <= activeDocument.Tables.Count)
                    {
                        PrintTable(number, activeDocument.Tables[number]);
                        number++;
                    }
                }
            }
            catch (Exception failure)
            {
                Console.WriteLine(failure);
            }

            Console.WriteLine();
            Console.WriteLine("Done executing!");
            Console.ReadLine();
        }

        /// <summary>
        /// Prints an underlined "Table #n" heading followed by one line per entry
        /// returned by <see cref="CellInfo.GetInfosFromTable"/> and a blank line.
        /// </summary>
        private static void PrintTable(int number, Word.Table table)
        {
            var heading = $"Table #{number}";

            Console.WriteLine(heading);
            Console.WriteLine(new string('-', heading.Length));

            foreach (var info in CellInfo.GetInfosFromTable(table))
            {
                Console.WriteLine(" - " + info);
            }

            Console.WriteLine();
        }

        /// <summary>
        /// Describes one position in the rectangular grid built for a Word table.
        /// The grid is filled from the table's XML (<c>table.Range.XML</c>): positions
        /// covered by a horizontal span or by a vertical merge are flagged, and every
        /// other position is paired with an interop cell where one can be found.
        /// </summary>
        class CellInfo
        {
            /// <summary>Interop cell found for (<see cref="Row"/>, <see cref="Column"/>), or null when none matched.</summary>
            public Word.Cell Cell { get; set; }

            /// <summary>The "tc" element placed at this grid position; null for positions only covered by a horizontal span.</summary>
            public XElement XmlCell { get; set; }

            /// <summary>Zero-based row index of this position in the XML grid.</summary>
            public int XmlRow { get; set; }

            /// <summary>Zero-based column index of this position in the XML grid.</summary>
            public int XmlColumn { get; set; }

            /// <summary>One-based row index used for the interop lookup; stays 0 for vertically merged positions.</summary>
            public int Row { get; set; }

            /// <summary>One-based column index used for the interop lookup; stays 0 for vertically merged positions.</summary>
            public int Column { get; set; }

            /// <summary>The "tc" element whose gridSpan covers this position, or null.</summary>
            public XElement MergedHorizontallyWith { get; set; }

            /// <summary>The "tc" element that starts the vertical merge covering this position, or null.</summary>
            public XElement MergedVerticallyWith { get; set; }

            /// <summary>
            /// Formats the position as "xml: r, c (interop: r, c): ..." followed either by
            /// a merge marker or by the XML text and the interop text of the cell.
            /// </summary>
            public override string ToString()
            {
                // XmlRow/XmlColumn come from the XML grid, Row/Column are the indexes used
                // for the interop lookup. The labels used to be attached the other way round.
                var position = $"xml: {XmlRow}, {XmlColumn} (interop: {Row}, {Column})";

                // A horizontal merge takes precedence when both markers are set.
                if (MergedHorizontallyWith != null)
                {
                    return $"{position}: MERGED HORIZONTALLY";
                }

                if (MergedVerticallyWith != null)
                {
                    return $"{position}: MERGED VERTICALLY";
                }

                var range = Cell?.Range;
                var interopText = string.Empty;

                if (!Equals(range, null))
                {
                    interopText = range.Text ?? string.Empty;

                    //\r\a marks the end of a cell, \r and \n are normal line breaks
                    interopText = interopText.Replace("\r\a", "<>").Replace("\r", "\\r").Replace("\n", "\\n");

                    // Drop the trailing end-of-cell marker; ordinal comparison keeps the
                    // check independent of the current culture.
                    if (interopText.EndsWith("<>", StringComparison.Ordinal))
                    {
                        interopText = interopText.Substring(0, interopText.Length - 2);
                    }
                }

                return $"{position}: {XmlCell?.Value ?? string.Empty} = {interopText}";
            }

            /// <summary>
            /// Builds the grid of <see cref="CellInfo"/> objects for <paramref name="table"/>:
            /// parses the table's XML, places each "tc" element at its grid position,
            /// flags horizontally and vertically merged positions and finally looks up
            /// the interop cell for every position that is not vertically merged.
            /// </summary>
            /// <param name="table">The Word table to analyse.</param>
            /// <returns>A [row, column] array with one entry per grid position.</returns>
            public static CellInfo[,] GetInfosFromTable(Word.Table table)
            {
                var doc = XDocument.Parse(table.Range.XML);

                // NOTE(review): the grid is sized from table.Rows.Count / table.Columns.Count;
                // this assumes those counts cover every grid position found in the XML - confirm.
                CellInfo[,] cellInfos = GetInitializedArray(table);

                var xmlTable = doc.Descendants().First(n => n.Name.LocalName == "tbl");

                // Only direct children are used so rows of nested tables are not picked up.
                var rows = xmlTable.Elements().Where(e => e.Name.LocalName == "tr").ToArray();

                for (int r = 0; r < rows.Length; r++)
                {
                    var rowCells = rows[r].Elements().Where(e => e.Name.LocalName == "tc");
                    var c = 0;
                    foreach (var rowCell in rowCells)
                    {
                        cellInfos[r, c].XmlCell = rowCell;
                        cellInfos[r, c].XmlRow = r;
                        cellInfos[r, c].XmlColumn = c;

                        var gridSpan = GetGridSpan(rowCell);

                        // Every additional grid column covered by the span becomes a placeholder.
                        for (int i = 1; i < gridSpan; i++)
                        {
                            cellInfos[r, c + i].MergedHorizontallyWith = rowCell;
                            cellInfos[r, c + i].XmlRow = r;
                            cellInfos[r, c + i].XmlColumn = c + i;
                        }

                        c += gridSpan;
                    }
                }

                ApplyVerticalMerges(cellInfos);

                FindCorrespondingInteropCells(table, cellInfos);

                return cellInfos;
            }

            /// <summary>
            /// Returns the named property element from the cell's own "tcPr" element, or
            /// null. Only direct children are inspected so that properties of cells in a
            /// nested table are never attributed to the outer cell.
            /// </summary>
            private static XElement FindCellProperty(XElement xmlCell, string localName)
            {
                var properties = xmlCell?.Elements().FirstOrDefault(e => e.Name.LocalName == "tcPr");
                return properties?.Elements().FirstOrDefault(e => e.Name.LocalName == localName);
            }

            /// <summary>Returns the value of the element's "val" attribute, or null when absent.</summary>
            private static string GetValAttribute(XElement element)
            {
                return element?.Attributes().FirstOrDefault(a => a.Name.LocalName == "val")?.Value;
            }

            /// <summary>Number of grid columns the cell spans; 1 when no usable gridSpan is present.</summary>
            private static int GetGridSpan(XElement xmlCell)
            {
                int gridSpan;
                if (!int.TryParse(GetValAttribute(FindCellProperty(xmlCell, "gridSpan")), out gridSpan) || gridSpan < 1)
                {
                    gridSpan = 1;
                }

                return gridSpan;
            }

            /// <summary>True when the vmerge element carries val="restart", i.e. it starts a vertical merge.</summary>
            private static bool IsMergeStart(XElement vmerge)
            {
                return GetValAttribute(vmerge) == "restart";
            }

            /// <summary>Creates a grid of empty <see cref="CellInfo"/> objects sized by the table's row and column counts.</summary>
            private static CellInfo[,] GetInitializedArray(Word.Table table)
            {
                var cellInfos = new CellInfo[table.Rows.Count, table.Columns.Count];
                for (int r = 0; r < cellInfos.GetLength(0); r++)
                {
                    for (int c = 0; c < cellInfos.GetLength(1); c++)
                    {
                        cellInfos[r, c] = new CellInfo();
                    }
                }

                return cellInfos;
            }

            /// <summary>Finds every cell that starts a vertical merge and flags the merged cells below it.</summary>
            private static void ApplyVerticalMerges(CellInfo[,] cellInfos)
            {
                for (int r = 0; r < cellInfos.GetLength(0); r++)
                {
                    for (int c = 0; c < cellInfos.GetLength(1); c++)
                    {
                        var vmerge = FindCellProperty(cellInfos[r, c].XmlCell, "vmerge");
                        if (vmerge != null && IsMergeStart(vmerge))
                        {
                            MarkCellsBelow(cellInfos, r, c);
                        }
                    }
                }
            }

            /// <summary>
            /// Walks down the column below the merge start at (<paramref name="parentR"/>,
            /// <paramref name="parentC"/>) and flags each continuation cell, stopping at
            /// the first cell without vmerge or at the next merge start.
            /// </summary>
            private static void MarkCellsBelow(CellInfo[,] cells, int parentR, int parentC)
            {
                var parentCell = cells[parentR, parentC];

                // The loop walks rows, so it is bounded by the row dimension (0). It used to
                // be bounded by the column dimension, which overran or cut short the walk
                // whenever the table was not square.
                for (int r = parentR + 1; r < cells.GetLength(0); r++)
                {
                    var cell = cells[r, parentC];

                    var vmerge = FindCellProperty(cell.XmlCell, "vmerge");
                    if (vmerge == null || IsMergeStart(vmerge))
                    {
                        break;
                    }

                    cell.MergedVerticallyWith = parentCell.XmlCell;
                }
            }

            /// <summary>
            /// Assigns one-based interop indexes to every position that is not vertically
            /// merged and looks up the matching interop cell.
            /// </summary>
            private static void FindCorrespondingInteropCells(Word.Table table, CellInfo[,] cellInfos)
            {
                for (int r = 0; r < cellInfos.GetLength(0); r++)
                {
                    for (int c = 0; c < cellInfos.GetLength(1); c++)
                    {
                        var cellInfo = cellInfos[r, c];

                        // Vertically merged positions keep Row/Column at 0 and get no cell,
                        // but they still occupy a column index.
                        if (cellInfo.MergedVerticallyWith != null)
                        {
                            continue;
                        }

                        // NOTE(review): positions covered by a horizontal span are numbered and
                        // looked up as well; whether the interop ColumnIndex counts grid columns
                        // or cells per row in such rows is not visible here - confirm.
                        cellInfo.Row = r + 1;
                        cellInfo.Column = c + 1;
                        cellInfo.Cell = GetCell(cellInfo, table);
                    }
                }
            }

            /// <summary>
            /// Returns the cell of <paramref name="table"/> whose RowIndex/ColumnIndex match
            /// the info's Row/Column at the table's own nesting level, or null when none matches.
            /// </summary>
            private static Word.Cell GetCell(CellInfo cellInfo, Word.Table table)
            {
                // Read once instead of on every iteration.
                var tableNestingLevel = table.NestingLevel;

                foreach (var cell in table.Range.Cells)
                {
                    // Cells of nested tables appear in the range too; skip them.
                    if (cell.NestingLevel != tableNestingLevel)
                    {
                        continue;
                    }

                    if (cellInfo.Column == cell.ColumnIndex && cellInfo.Row == cell.RowIndex)
                    {
                        return cell;
                    }
                }

                return null;
            }

        }

    }
}

      

If you only want to know whether a table contains merged cells, you can use the Table.Uniform property.

+1


source







All Articles