blob: 4dd9c13c9f5f603451384420608cd9bfe4f80b65 [file] [log] [blame]
/* FILE: sub_min.cpp
* DATE MODIFIED: 31-Aug-07
* DESCRIPTION: Part of the SREC graph compiler project source files.
*
* Copyright 2007, 2008 Nuance Communciations, Inc. *
* *
* Licensed under the Apache License, Version 2.0 (the 'License'); *
* you may not use this file except in compliance with the License. *
* *
* You may obtain a copy of the License at *
* http://www.apache.org/licenses/LICENSE-2.0 *
* *
* Unless required by applicable law or agreed to in writing, software *
* distributed under the License is distributed on an 'AS IS' BASIS, *
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. *
* See the License for the specific language governing permissions and *
* limitations under the License. *
* *
*---------------------------------------------------------------------------*/
#include <iostream>
#include <string>
#include <assert.h>
#include <cstdio>
#include "sub_grph.h"
#define SYMBOL_COMPARE(x,y) (arc[x]->CompareSymbol(arc[y]))
#define COMPARE(x,y) (arc[x]->Compare(arc[y]))
// Minimization to facilitate moving output symbols - mainly for phoneme networks
// Check partial merge
// Move the output symbol if only one node
/*
static int checkEntry (int *itemList, int count, int item);
static int checkEntry (int *itemList, int count, int item)
{
for (int ii= 0; ii < count; ii++)
if (item == itemList[ii])
return ii;
return -1;
}
*/
void SubGraph::ViewNode (int currId)
{
int rix;
printf ("Node: %d\n", currId);
rix= FindFromIndex (currId);
if (rix < 0)
return;
while (rix < numArc && arc[forwardList[rix]]->GetFromId() == currId) {
arc[forwardList[rix]]->Print();
rix++;
}
return;
}
bool SubGraph::EquivalenceTestForward (int firstId, int secondId, int *equivMap)
{
int fix, six, fnxt, snxt, tof, tos, count;
assert (firstId != secondId);
fix= FindFromIndex (firstId);
six= FindFromIndex (secondId);
if (fix < 0 || six < 0)
return false;
count= 0;
do {
// Move to next valid transitions
while (fix < numArc && arc[forwardList[fix]]->GetFromId() == firstId
&& arc[forwardList[fix]]->GetToId() == DISCARD_LABEL)
fix++;
if (fix < numArc && arc[forwardList[fix]]->GetFromId() == firstId)
fnxt= arc[forwardList[fix]]->GetFromId();
else
fnxt= -1;
while (six < numArc && arc[forwardList[six]]->GetFromId() == secondId
&& arc[forwardList[six]]->GetToId() == DISCARD_LABEL)
six++;
if (six < numArc && arc[forwardList[six]]->GetFromId() == secondId)
snxt= arc[forwardList[six]]->GetFromId();
else
snxt= -1;
if (fnxt != firstId && snxt != secondId)
return true;
else if (fnxt != firstId || snxt != secondId)
return false;
tos= arc[forwardList[six]]->GetToId();
tof= arc[forwardList[fix]]->GetToId();
// printf ("Debug inner %d %d, %d %d\n", tof, tos, equivMap[tof], equivMap[tos]);
// if (tof >= 0) bogus assert
// assert (tof == equivMap[tof]);
// if (tos >= 0)
// assert (tos == equivMap[tos]);
// Test
if (!arc[forwardList[fix]]->HasSameLabels (arc[forwardList[six]])
|| tos != tof)
return false;
count++;
fix++;
six++;
} while (fnxt >= 0 && snxt >= 0);
return false;
}
void SubGraph::IdentifyEquivalence (int *depthMap, int *equivMap)
{
int ii, jj, dd, maxDepth, count, itCnt;
maxDepth= 0;
for (ii= 0; ii < numVertex; ii++) {
if (maxDepth < depthMap[ii])
maxDepth= depthMap[ii];
}
itCnt= 0;
do {
count= 0;
for (dd= 0; dd <= maxDepth; dd++)
for (ii= 0; ii < numVertex; ii++)
if (depthMap[ii] == dd && ii == equivMap[ii]) {
CheckForChangeAndResort (ii, equivMap);
for (jj= ii+1; jj < numVertex; jj++)
if (depthMap[jj] == dd && jj == equivMap[jj]) {
// Equivalence test
CheckForChangeAndResort (jj, equivMap);
// printf ("Try %d %d, ", ii, jj);
if (EquivalenceTestForward (ii, jj, equivMap)) {
equivMap[jj]= ii;
// printf ("Merged %d %d\n", ii, jj);
count++;
}
}
}
itCnt++;
// printf ("Total %d mergers\n", count);
} while (count > 0 && itCnt < MAXITS);
return;
}
void SubGraph::CheckForChangeAndResort (int currId, int *mapList)
{
int rix, rixBegin, nextId;
bool needSort;
needSort= false;
rixBegin= rix= FindFromIndex (currId);
if (rix < 0)
return;
while (rix < numArc && arc[forwardList[rix]]->GetFromId() == currId) {
nextId= arc[forwardList[rix]]->GetToId();
if (nextId >= 0 && mapList[nextId] != nextId) {
needSort= true;
arc[forwardList[rix]]->AssignToId(mapList[nextId]);
}
rix++;
}
// Resort
if (needSort)
RemoveDuplicatesAtNode (rixBegin, rix);
return;
}
void SubGraph::DeterminizeAtVertex (int baseId, DetCache *cache)
{
int fix, six, firstId, secondId, vertEnd;
fix= FindFromIndex (baseId);
if (fix < 0)
return;
// Remove duplicates
vertEnd= fix;
six= -1;
while (vertEnd < sortNum && arc[forwardList[vertEnd]]->GetFromId() == baseId) {
vertEnd++;
}
vertEnd++;
// Iteration over first node
firstId= -1;
while (fix < sortNum && arc[forwardList[fix]]->GetFromId() == baseId) {
// Iterator for firstId
while (fix < sortNum && arc[forwardList[fix]]->GetFromId() == baseId
&& (arc[forwardList[fix]]->GetToId() == firstId
|| arc[forwardList[fix]]->GetInput() == TERMINAL_LABEL
|| arc[forwardList[fix]]->GetInput() == DISCARD_LABEL))
fix++;
// Terminal Condition
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != baseId)
break;
else
firstId= arc[forwardList[fix]]->GetToId();
// Iteration over second node
six= fix;
secondId= firstId;
while (six < sortNum && arc[forwardList[six]]->GetFromId() == baseId) {
// Iterator for secondId
while (six < sortNum && arc[forwardList[six]]->GetFromId() == baseId
&& (arc[forwardList[six]]->GetToId() == secondId
|| arc[forwardList[six]]->GetInput() == TERMINAL_LABEL
|| arc[forwardList[six]]->GetInput() == DISCARD_LABEL))
six++;
// Terminal condition
if (six >= sortNum || arc[forwardList[six]]->GetFromId() != baseId)
break;
else
secondId= arc[forwardList[six]]->GetToId();
// Now we have both Ids worked out
assert (firstId >= 0);
assert (secondId >= 0);
assert (arc[forwardList[fix]]->GetInput() != DISCARD_LABEL);
assert (arc[forwardList[six]]->GetInput() != DISCARD_LABEL);
if (PairwiseDeterminize (baseId, firstId, fix, secondId, six, cache) > 0) {
SortLanguageAtSortIndices (fix, vertEnd);
// Are we done with the first node?
while (fix < sortNum && arc[forwardList[fix]]->GetFromId() == baseId
&& arc[forwardList[fix]]->GetInput() == DISCARD_LABEL)
fix++;
// Terminal condition
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != baseId
|| arc[forwardList[fix]]->GetToId() != firstId)
break;
}
}
}
return;
}
int SubGraph::PairwiseDeterminize (int baseId, int firstId, int fixStart, int secondId,
int sixStart, DetCache *cache)
{
int fix, six, fmiss, smiss, nmatch, symTst, newId;
bool isCached;
fix= fixStart;
six= sixStart;
assert (arc[forwardList[fix]]->GetInput() != DISCARD_LABEL);
assert (arc[forwardList[six]]->GetInput() != DISCARD_LABEL);
// Count
isCached= false;
fmiss= smiss= nmatch= 0;
newId= -1;
while (six < sortNum && fix < sortNum) {
assert (arc[forwardList[fix]]->GetInput() != DISCARD_LABEL);
assert (arc[forwardList[six]]->GetInput() != DISCARD_LABEL);
symTst= SYMBOL_COMPARE (forwardList[fix], forwardList[six]);
if (symTst == 0) {
if (newId == -1) {
newId= cache->QueryEntry (firstId, secondId);
if (newId < 0)
newId= NewVertexId ();
else
isCached= true;
// printf ("Forming %d with %d and %d at %d\n", newId, firstId, secondId, baseId);
}
// Assign second to new Vertex
arc[forwardList[six]]->AssignToId (newId);
// Assign first to DISCARD Index
arc[forwardList[fix]]->AssignInput (DISCARD_LABEL);
// Increment to next
do {
fix++;
} while (fix < sortNum && arc[forwardList[fix]]->GetInput() == DISCARD_LABEL);
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != baseId
|| arc[forwardList[fix]]->GetToId() != firstId)
fix= sortNum;
do {
six++;
} while (six < sortNum && arc[forwardList[six]]->GetInput() == DISCARD_LABEL);
if (six >= sortNum || arc[forwardList[six]]->GetFromId() != baseId
|| arc[forwardList[six]]->GetToId() != secondId)
six= sortNum;
nmatch++;
}
else if (symTst < 0) {
do {
fix++;
} while (fix < sortNum && arc[forwardList[fix]]->GetInput() == DISCARD_LABEL);
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != baseId
|| arc[forwardList[fix]]->GetToId() != firstId)
fix= sortNum;
fmiss++;
}
else if (symTst > 0) {
do {
six++;
} while (six < sortNum && arc[forwardList[six]]->GetInput() == DISCARD_LABEL);
if (six >= sortNum || arc[forwardList[six]]->GetFromId() != baseId
|| arc[forwardList[six]]->GetToId() != secondId)
six= sortNum;
smiss++;
}
}
// SortLanguageAtSortIndices (fixStart, fix);
if (newId >= 0) {
if (isCached == false) {
// numLast= numArc;
MergeVertices (newId, firstId, secondId);
cache->AddEntry (newId, firstId, secondId);
// UpdateVisitationCache (numLast);
}
assert (nmatch > 0);
}
// Update fan-in count
if (nmatch > 0) {
// printf ("Merging %d %d to create %d\n", firstId, secondId, newId);
for (int ii= 0; ii < nmatch; ii++) {
// IncNodeProperty (newId);
IncVisitationCache (newId);
DecVisitationCache (firstId);
DecVisitationCache (secondId);
}
}
return nmatch;
}
void SubGraph::MergeVertices (int newId, int firstId, int secondId)
{
int fix, six, symTst, numStart;
NUANArc *arcOne;
numStart= numArc;
fix= FindFromIndex (firstId);
six= FindFromIndex (secondId);
if (fix < 0 || six < 0) {
if (fix >= 0)
while (fix < sortNum && arc[forwardList[fix]]->GetFromId() == firstId) {
if (arc[forwardList[fix]]->GetInput() != DISCARD_LABEL)
InheritArc (arc[forwardList[fix]], newId);
fix++;
}
else if (six >= 0)
while (six < sortNum && arc[forwardList[six]]->GetFromId() == secondId) {
if (arc[forwardList[six]]->GetInput() != DISCARD_LABEL)
InheritArc (arc[forwardList[six]], newId);
six++;
}
}
else {
while (six < sortNum && fix < sortNum) {
symTst= SYMBOL_COMPARE (forwardList[fix], forwardList[six]);
if (symTst == 0) {
if (arc[forwardList[fix]]->GetToId() == firstId
&& arc[forwardList[six]]->GetToId() == secondId) {
arcOne= InheritArc (arc[forwardList[fix]], newId);
arcOne->AssignToId (newId);
}
else if (arc[forwardList[fix]]->GetToId()
== arc[forwardList[six]]->GetToId()) {
InheritArc (arc[forwardList[fix]], newId);
}
else {
InheritArc (arc[forwardList[fix]], newId);
InheritArc (arc[forwardList[six]], newId);
}
// Increment to next
do {
fix++;
} while (fix < sortNum && arc[forwardList[fix]]->GetInput() == DISCARD_LABEL);
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != firstId
|| arc[forwardList[fix]]->GetFromId() != firstId)
fix= sortNum;
do {
six++;
} while (six < sortNum && arc[forwardList[six]]->GetInput() == DISCARD_LABEL);
if (six >= sortNum || arc[forwardList[six]]->GetFromId() != secondId)
six= sortNum;
}
else if (symTst < 0) {
InheritArc (arc[forwardList[fix]], newId);
do {
fix++;
} while (fix < sortNum && arc[forwardList[fix]]->GetInput() == DISCARD_LABEL);
if (fix >= sortNum || arc[forwardList[fix]]->GetFromId() != firstId
|| arc[forwardList[fix]]->GetFromId() != firstId)
fix= sortNum;
}
else if (symTst > 0) {
InheritArc (arc[forwardList[six]], newId);
do {
six++;
} while (six < sortNum && arc[forwardList[six]]->GetInput() == DISCARD_LABEL);
if (six >= sortNum || arc[forwardList[six]]->GetFromId() != secondId
|| arc[forwardList[six]]->GetFromId() != secondId)
six= sortNum;
}
}
while (fix < sortNum && arc[forwardList[fix]]->GetFromId() == firstId) {
if (arc[forwardList[fix]]->GetInput() != DISCARD_LABEL)
InheritArc (arc[forwardList[fix]], newId);
fix++;
}
while (six < sortNum && arc[forwardList[six]]->GetFromId() == secondId) {
if (arc[forwardList[six]]->GetInput() != DISCARD_LABEL)
InheritArc (arc[forwardList[six]], newId);
six++;
}
}
// Update the sort list
UpdateSortForLanguage ();
// RemoveDuplicatesAtNode (numStart, numArc);
// ViewNode (newId);
assert (CheckSort());
// printf ("Merging %d %d to create %d\n", firstId, secondId, newId);
return;
}
void SubGraph::SetupVisitationCache ()
{
int ii;
CreateNodeProperty ();
for (ii= 0; ii < numArc; ii++)
if (arc[ii]->GetInput() != DISCARD_LABEL && arc[ii]->GetToId() >= 0)
IncNodeProperty (arc[ii]->GetToId());
return;
}
void SubGraph::ClearVisitationCache ()
{
DeleteNodeProperty ();
return;
}
void SubGraph::UpdateVisitationCache (int startNo)
{
int ii;
for (ii= startNo; ii < numArc; ii++)
if (arc[ii]->GetInput() != DISCARD_LABEL && arc[ii]->GetToId() >= 0) {
IncNodeProperty (arc[ii]->GetToId());
// std::cout << " (" << arc[ii]->GetToId() << " " << QueryNodeProperty (arc[ii]->GetToId()) << ") ";
}
// std::cout << std::endl;
return;
}
void SubGraph::DecVisitationCache (int currId)
{
int rix;
DecNodeProperty (currId);
// std::cout << " [" << currId << " " << QueryNodeProperty (currId) << "] ";
if (QueryNodeProperty (currId) <= 0) {
// std::cout << " [" << currId << "] ";
rix= FindFromIndex (currId);
if (rix < 0)
return;
while (rix < sortNum && arc[forwardList[rix]]->GetFromId() == currId) {
if (arc[forwardList[rix]]->GetInput() != DISCARD_LABEL
&& arc[forwardList[rix]]->GetToId() >= 0) {
if (arc[forwardList[rix]]->GetFromId() == arc[forwardList[rix]]->GetToId())
DecNodeProperty (currId);
else if (QueryNodeProperty (arc[forwardList[rix]]->GetToId()) > 0)
DecVisitationCache (arc[forwardList[rix]]->GetToId());
}
rix++;
}
}
return;
}
void SubGraph::IncVisitationCache (int currId)
{
int rix;
if (QueryNodeProperty (currId) <= 0) {
IncNodeProperty (currId);
// std::cout << " (" << currId << ") ";
rix= FindFromIndex (currId);
if (rix < 0)
return;
while (rix < sortNum && arc[forwardList[rix]]->GetFromId() == currId) {
if (arc[forwardList[rix]]->GetInput() != DISCARD_LABEL
&& arc[forwardList[rix]]->GetToId() >= 0) {
// IncNodeProperty (arc[forwardList[rix]]->GetToId());
// if (currId != arc[forwardList[rix]]->GetToId())
IncVisitationCache (arc[forwardList[rix]]->GetToId());
}
rix++;
}
}
else
IncNodeProperty (currId);
// std::cout << " (" << currId << " " << QueryNodeProperty (currId) << ") ";
return;
}
int SubGraph::VisitationConsistencyCheck ()
{
int ii, failCount;
int *nodeCount= new int [numVertex];
UpdateVertexCount (0);
// std::cout << "Count: ";
for (ii= 0; ii <numVertex; ii++) {
// std::cout << ii << " (" << vertexProp[ii] << ") ";
nodeCount[ii]= 0;
}
// std::cout << std::endl;
for (ii= 0; ii <numArc; ii++)
if (arc[ii]->GetInput() != DISCARD_LABEL && arc[ii]->GetToId() >= 0
&& (vertexProp[arc[ii]->GetFromId()] > 0 || arc[ii]->GetFromId() == startId))
nodeCount[arc[ii]->GetToId()]++;
failCount= 0;
// std::cout << "Failure list: ";
for (ii= 0; ii <numVertex; ii++)
if (vertexProp[ii] != nodeCount[ii]) {
// std::cout << ii << " (" << vertexProp[ii] << " " << nodeCount[ii] << ") ";
failCount++;
}
// std::cout << std::endl;
// return failCount;
delete [] nodeCount;
return 0;
}