/* * Copyright 2016 Christoph Böhme * * Licensed under the Apache License, Version 2.0 the "License"; * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.culturegraph.mf.strings; import static org.mockito.ArgumentMatchers.any; import static org.mockito.ArgumentMatchers.eq; import static org.mockito.Mockito.inOrder; import static org.mockito.Mockito.never; import static org.mockito.Mockito.verify; import static org.mockito.Mockito.verifyZeroInteractions; import org.culturegraph.mf.framework.StreamReceiver; import org.junit.Before; import org.junit.Test; import org.mockito.InOrder; import org.mockito.Mock; import org.mockito.MockitoAnnotations; /** * Tests for class {@link RegexDecoder}. * * @author Christoph Böhme (rewrite) * @author Thomas Seidel * */ public final class RegexDecoderTest { @Mock private StreamReceiver receiver; @Before public void setup() { MockitoAnnotations.initMocks(this); } @Test public void shouldEmitStartAndEndRecordForMatchingInput() { final RegexDecoder regexDecoder = new RegexDecoder(".*"); regexDecoder.setReceiver(receiver); regexDecoder.process("matching input"); final InOrder ordered = inOrder(receiver); ordered.verify(receiver).startRecord(any()); ordered.verify(receiver).endRecord(); } @Test public void shouldIgnoreNonMatchingInput() { final RegexDecoder regexDecoder = new RegexDecoder("abc"); regexDecoder.setReceiver(receiver); regexDecoder.process("non-matching input"); verifyZeroInteractions(receiver); } @Test public void shouldUseCaptureGroupNamedIdAsRecordId() { final RegexDecoder regexDecoder = new RegexDecoder("ID:(?<id>.*)"); regexDecoder.setReceiver(receiver); regexDecoder.process("ID:id-123"); verify(receiver).startRecord("id-123"); } @Test public void shouldUseEmptyStringAsRecordIdIfNoRecordIdCaptureGroupExists() { final RegexDecoder regexDecoder = new RegexDecoder("ID:(?<identifier>.*)"); regexDecoder.setReceiver(receiver); regexDecoder.process("ID:id-123"); verify(receiver).startRecord(""); } @Test public void shouldUseEmptyStringAsRecordIdIfRecordIdCaptureGroupDoesNotMatch() { final RegexDecoder regexDecoder = new RegexDecoder("ID:(?<id>[0-9]*).*"); regexDecoder.setReceiver(receiver); regexDecoder.process("ID:id-123"); verify(receiver).startRecord(""); } @Test public void shouldEmitLiteralContainingUnmodifiedInputIfRawInputLiteralIsSet() { final RegexDecoder regexDecoder = new RegexDecoder(".*"); regexDecoder.setReceiver(receiver); regexDecoder.setRawInputLiteral("input"); regexDecoder.process("foo=1234,bar=abcd"); verify(receiver).literal("input", "foo=1234,bar=abcd"); } @Test public void shouldUseGroupNameAsLiteralNameForNamedCaptureGroups() { final RegexDecoder regexDecoder = new RegexDecoder( "foo=(?<foo>[0-9]+),bar=(?<bar>[a-z]+)"); regexDecoder.setReceiver(receiver); regexDecoder.process("foo=1234,bar=abcd"); final InOrder ordered = inOrder(receiver); ordered.verify(receiver).literal("foo", "1234"); ordered.verify(receiver).literal("bar", "abcd"); } @Test public void shouldOutputLiteralsForEachMatchOfPattern() { final RegexDecoder regexDecoder = new RegexDecoder( "foo=(?<foo>[0-9]+),bar=(?<bar>[a-z]+)"); regexDecoder.setReceiver(receiver); regexDecoder.process("foo=1234,bar=abcd,foo=5678,bar=efgh"); final InOrder ordered = inOrder(receiver); ordered.verify(receiver).literal("foo", "1234"); ordered.verify(receiver).literal("bar", "abcd"); ordered.verify(receiver).literal("foo", "5678"); ordered.verify(receiver).literal("bar", "efgh"); } @Test public void shouldIgnoreNonMatchingPartsOfInputString() { final RegexDecoder regexDecoder = new RegexDecoder( "foo=(?<foo>[0-9]+)"); regexDecoder.setReceiver(receiver); regexDecoder.process("foo=1234,bar=abcd,foo=5678,bar=efgh"); final InOrder ordered = inOrder(receiver); ordered.verify(receiver).literal("foo", "1234"); ordered.verify(receiver, never()).literal("bar", "abcd"); ordered.verify(receiver).literal("foo", "5678"); ordered.verify(receiver, never()).literal("bar", "efgh"); } @Test public void shouldIgnoreUnnamedCaptureGroups() { final RegexDecoder regexDecoder = new RegexDecoder( "foo=([0-9]+),bar=(?<bar>[a-z]+)"); regexDecoder.setReceiver(receiver); regexDecoder.process("foo=1234,bar=abcd,foo=5678,bar=efgh"); verify(receiver, never()).literal(any(), eq("1234")); verify(receiver, never()).literal(any(), eq("5678")); } }