The Blog of Ian Mercer.

A strongly-typed, RegEx-based parser for handling input strings

Cover Image for A strongly-typed, RegEx-based parser for handling input strings

Quite often I have to parse a string coming from some other system in the home. These strings often contain odd delimiter characters, for example, "# 123 VO256 SP256+". I used to have a lot of code that attempted to parse such strings using String.Split() and int.TryParse(), plus a whole lot more code to check that the results were valid. Some time ago I switched to the class below, which takes a regular expression defining the groups to parse and then provides strongly typed methods to extract the values.

For example, you can parse that string I just mentioned using this:

    // A verbatim string (@"...") keeps the regex backslashes intact: \d+ matches a run
    // of digits and \+ matches the literal trailing plus sign.
    var sp = new Parser(@"# (\d+) VO(\d+) SP(\d+)\+");
    int a, b, c;
    bool ok = sp.Parse<int, int, int>("# 123 VO256 SP256+", out a, out b, out c);

Below is the parser class. Of note is the way the conversion is handled from a matched string to the type specified using TypeDescriptor.GetConverter(). Doing it this way allows for a wide variety of different types to be handled.

/// <summary>
/// A regular-expression based parser that extracts up to 10 capture groups from an
/// input string and converts each one to a caller-specified type.
/// </summary>
/// <remarks>
/// Capture group N of the pattern (1-based) is assigned to the N-th <c>out</c> parameter.
/// Each captured string is converted with the <see cref="TypeConverter"/> returned by
/// <see cref="TypeDescriptor.GetConverter(System.Type)"/> using the invariant culture.
/// Every <c>Parse</c> overload returns <c>true</c> only when the pattern matched and
/// every requested group was converted; any output that could not be produced is set
/// to the default value of its type.
/// </remarks>
public class Parser
{
    readonly Regex regex;

    /// <summary>
    /// Creates a parser for the given pattern. The pattern is compiled once and reused
    /// for every call to <c>Parse</c>.
    /// </summary>
    /// <param name="regularExpression">Pattern whose capture groups define the values to extract.</param>
    public Parser(string regularExpression)
    {
        this.regex = new Regex(regularExpression, RegexOptions.Compiled);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture group 1.</summary>
    /// <param name="input">The string to parse; <c>null</c> is treated as a failed match.</param>
    /// <param name="value1">Receives the converted value of group 1, or the default on failure.</param>
    /// <returns><c>true</c> if the pattern matched and the group was converted.</returns>
    public bool Parse<T>(string input, out T value1)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1);
    }

    // NOTE: the overloads below deliberately combine results with the non-short-circuit
    // '&' operator. Every Assign call must run so that every out parameter is assigned,
    // even after an earlier group has already failed.

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-2.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2>(string input, out T1 value1, out T2 value2)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-3.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3>(string input, out T1 value1, out T2 value2, out T3 value3)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-4.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-5.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-6.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5, T6>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5, out T6 value6)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5)
             & Assign(match, 6, out value6);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-7.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5, T6, T7>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5, out T6 value6, out T7 value7)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5)
             & Assign(match, 6, out value6)
             & Assign(match, 7, out value7);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-8.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5, T6, T7, T8>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5, out T6 value6, out T7 value7, out T8 value8)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5)
             & Assign(match, 6, out value6)
             & Assign(match, 7, out value7)
             & Assign(match, 8, out value8);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-9.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5, T6, T7, T8, T9>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5, out T6 value6, out T7 value7, out T8 value8, out T9 value9)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5)
             & Assign(match, 6, out value6)
             & Assign(match, 7, out value7)
             & Assign(match, 8, out value8)
             & Assign(match, 9, out value9);
    }

    /// <summary>Parses <paramref name="input"/> and extracts capture groups 1-10.</summary>
    /// <returns><c>true</c> if the pattern matched and every group was converted.</returns>
    public bool Parse<T1, T2, T3, T4, T5, T6, T7, T8, T9, T10>(string input, out T1 value1, out T2 value2, out T3 value3, out T4 value4, out T5 value5, out T6 value6, out T7 value7, out T8 value8, out T9 value9, out T10 value10)
    {
        var match = this.MatchInput(input);
        return Assign(match, 1, out value1)
             & Assign(match, 2, out value2)
             & Assign(match, 3, out value3)
             & Assign(match, 4, out value4)
             & Assign(match, 5, out value5)
             & Assign(match, 6, out value6)
             & Assign(match, 7, out value7)
             & Assign(match, 8, out value8)
             & Assign(match, 9, out value9)
             & Assign(match, 10, out value10);
    }

    /// <summary>
    /// Runs the pattern against <paramref name="input"/>. A <c>null</c> input is reported
    /// as a failed match rather than an exception, so Parse can simply return false.
    /// </summary>
    private Match MatchInput(string input)
    {
        return input == null ? Match.Empty : this.regex.Match(input);
    }

    /// <summary>
    /// Converts the text of capture group <paramref name="index"/> to <typeparamref name="X"/>.
    /// </summary>
    /// <param name="match">The result of matching the input against the pattern.</param>
    /// <param name="index">The capture group number to read.</param>
    /// <param name="value">Receives the converted value, or <c>default(X)</c> on failure.</param>
    /// <returns>
    /// <c>true</c> if the match succeeded and the group text was converted;
    /// <c>false</c> if the match failed or the conversion was rejected.
    /// </returns>
    private static bool Assign<X>(Match match, int index, out X value)
    {
        if (!match.Success)
        {
            value = default(X);
            return false;
        }

        // The group's text is an empty string when the group captured nothing; whether
        // that converts depends on the target type's converter (e.g. string accepts it).
        string text = match.Groups[index].Value;
        try
        {
            var converter = TypeDescriptor.GetConverter(typeof(X));
            value = (X)converter.ConvertFromInvariantString(text);
            return true;
        }
        catch (System.Exception)
        {
            // TypeConverter offers no "Try" API and converters signal bad input with a
            // variety of exception types, so any conversion failure is reported through
            // the bool result, in keeping with the Parse contract.
            value = default(X);
            return false;
        }
    }
}

Related Stories

Cover Image for My love/hate relationship with Stackoverflow

My love/hate relationship with Stackoverflow

Stackoverflow is a terrific source of information but can also be infuriating.

Ian Mercer
Ian Mercer
Cover Image for Xamarin Forms Application For Home Automation

Xamarin Forms Application For Home Automation

Building a Xamarin Forms application to control my home automation system

Ian Mercer
Ian Mercer

JSON Patch - a C# implementation

Ian Mercer
Ian Mercer

Websites should stop using passwords for login!

A slightly radical idea to eliminate passwords from many of the websites you use just occasionally

Ian Mercer
Ian Mercer

Dynamically building 'Or' Expressions in LINQ

How to create a LINQ expression that logically ORs together a set of predicates

Ian Mercer
Ian Mercer

VariableWithHistory - making persistence invisible, making history visible

A novel approach to adding history to variables in a programming language

Ian Mercer
Ian Mercer

Neo4j Meetup in Seattle - some observations

Some observations from a meetup in Seattle on graph databases and Neo4j

Ian Mercer
Ian Mercer

Updated Release of the Abodit State Machine

A hierarchical state machine for .NET

Ian Mercer
Ian Mercer

My first programme [sic]

At the risk of looking seriously old, here's something found on a paper tape

Ian Mercer
Ian Mercer

Building a better .NET State Machine

A state machine for .NET that I've released on Nuget

Ian Mercer
Ian Mercer
Cover Image for The Internet of Dogs

The Internet of Dogs

Connecting our dog into the home automation

Ian Mercer
Ian Mercer

A simple state machine in C#

State machines are useful in many contexts but especially for home automation

Ian Mercer
Ian Mercer

Convert a property getter to a setter

Ian Mercer
Ian Mercer

MongoDB Map-Reduce - Hints and Tips

Ian Mercer
Ian Mercer
Cover Image for Weather Forecasting for Home Automation

Weather Forecasting for Home Automation

Ian Mercer
Ian Mercer

Lengthening short Urls in C#

Ian Mercer
Ian Mercer

Why don't you trust your build system?

Ian Mercer
Ian Mercer

ASP.NET MVC SEO - Solution Part 1

Ian Mercer
Ian Mercer

Elliott 803 - An Early Computer

Ian Mercer
Ian Mercer

Building sitemap.xml for SEO ASP.NET MVC

Ian Mercer
Ian Mercer

Continuous Integration -> Continuous Deployment

What is "quality" in terms of a released software product or website?

Ian Mercer
Ian Mercer

Making a bootable Windows 7 USB Memory Stick

Here's how I made a bootable USB memory stick for Windows 7

Ian Mercer
Ian Mercer

Tip: getting the index in a foreach statement

A tip on using LINQ's Select expression with an index

Ian Mercer
Ian Mercer

SQL Server - error: 18456, severity: 14, state: 38 - Incorrect Login

A rant about developers using the same message for different errors

Ian Mercer
Ian Mercer

WCF and the SYSTEM account

Namespace reservations and http.sys, my, oh my!

Ian Mercer
Ian Mercer

404 errors on IIS6 with ASP.NET 4 Beta 2

Ian Mercer
Ian Mercer

Mixed mode assembly errors after upgrade to .NET 4 Beta 2

Fixing this error was fairly simple

Ian Mercer
Ian Mercer

The EntityContainer name could not be determined

How to fix the exception "the entitycontainer" name could not be determined

Ian Mercer
Ian Mercer

Shortened URLs should be treated like a Codec ...

Expanding URLs would help users decide whether or not to click a link

Ian Mercer
Ian Mercer

Tagging File Systems

Isn't it time we stopped knowing which drive our file is on?

Ian Mercer
Ian Mercer

A great site for developing and testing regular expressions

Just a link to a site I found useful

Ian Mercer
Ian Mercer

Introducing Jigsaw menus

A novel UI for menus that combines a breadcrumb and a menu in one visual metaphor

Ian Mercer
Ian Mercer

Entity Framework in .NET 4

Ian Mercer
Ian Mercer

Fix for IE's overflow:hidden problem

Ian Mercer
Ian Mercer

A better Tail program for Windows

A comparison of tail programs for Windows

Ian Mercer
Ian Mercer

Measuring website browser performance

Found this great resource on website performance

Ian Mercer
Ian Mercer

Amazon Instance vs Dedicated Server comparison

Some benchmark performance for Amazon vs a dedicated server

Ian Mercer
Ian Mercer

System.Data.EntitySqlException

Hints for dealing with this exception

Ian Mercer
Ian Mercer

Agile Software Development is Like Sailing

You cannot tack too often when sailing or you get nowhere. Agile is a bit like that.

Ian Mercer
Ian Mercer

Exception Handling using Exception.Data

My latest article on CodeProject covers the lesser known Exception.Data property

Ian Mercer
Ian Mercer

Javascript error reporting

Sending client-side errors back to a server for analysis

Ian Mercer
Ian Mercer

AntiVirus Software is the Worst Software!

When your anti-virus software starts stealing your personal data, it's time to remove it!

Ian Mercer
Ian Mercer

ASP.NET Custom Validation

How to solve a problem encountered with custom validation in ASP.NET

Ian Mercer
Ian Mercer

Optimization Advice

Some advice on software optimization

Ian Mercer
Ian Mercer

Linq's missing link

LinqKit came in handy back in 2009

Ian Mercer
Ian Mercer

Google Chart API

Ian Mercer
Ian Mercer

Cache optimized scanning of pairwise combinations of values

Using space-filling curves to optimize caching

Ian Mercer
Ian Mercer

Threading and User Interfaces

A rant about how few software programs get threading right

Ian Mercer
Ian Mercer

Take out the trash!

Why Windows shutdown takes so long

Ian Mercer
Ian Mercer

Dell upgrades - a pricey way to go

Ian Mercer
Ian Mercer

Programming mostly C#

Ian's advice on programming

Ian Mercer
Ian Mercer