Skip to content

Commit

Permalink
Merge branch 'master' of https://github.com/Microsoft/CNTK
Browse files Browse the repository at this point in the history
  • Loading branch information
Dong Yu committed Jan 22, 2016
2 parents 7ff3d37 + 59287d0 commit 2374adc
Show file tree
Hide file tree
Showing 33 changed files with 1,062 additions and 1,262 deletions.
4 changes: 2 additions & 2 deletions Source/CNTK/ModelEditLanguage.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -138,12 +138,12 @@ void MELScript<ElemType>::CallFunction(const std::string& p_name, const ConfigPa
std::wstring modelFormat = GetOptionalModelFormat(params, numFixedParams);

auto cn = make_shared<ComputationNetwork>(CPUDEVICE);
#if 1 // support for a specific kind of legacy format, for the sole purpose of allowing users to convert (=load & save) them
#if 1 // support for a specific kind of legacy format, for the sole purpose of allowing users to convert (=load & save) them
if (modelFormat == L"cntk_legacy_no_tensorlib")
{
cn->Read<ElemType>(params[1]);
for (auto node : cn->FeatureNodes())
node->SetDims(TensorShape(node->GetNumRows()), 0); // pre-tensorlib InputValues had incorrect tensor dimensions
node->SetDims(TensorShape(node->GetSampleMatrixNumRows()), node->HasMBLayout()); // pre-tensorlib InputValues had incorrect tensor dimensions
cn->CompileNetwork();
}
else
Expand Down
9 changes: 0 additions & 9 deletions Source/CNTK/NDLUtil.h
Original file line number Diff line number Diff line change
Expand Up @@ -31,12 +31,6 @@ class NDLUtil
{
}

// FixupInputMinibatchSize - go through all the inputs and make sure they have a consistent minibatch size
void FixupInputMinibatchSize()
{
m_net->FixupInputMinibatchSize();
}

// ProcessNDLConfig - Process the NDL script from a configuration string value
// config - configuration string containing script
void ProcessNDLConfig(const ConfigValue& config, bool fullValidate = false)
Expand Down Expand Up @@ -105,10 +99,7 @@ class NDLUtil
SynchronousNodeEvaluator<ElemType> ndlEvaluator(m_net);
NDLNode<ElemType>* lastNode = script->Evaluate(ndlEvaluator, L"", ndlPass, skipThrough);
if (ndlPass == ndlPassResolve)
{
SetOutputNodes(script);
FixupInputMinibatchSize();
}
return lastNode;
}

Expand Down
16 changes: 8 additions & 8 deletions Source/CNTK/SimpleNetworkBuilder.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1753,7 +1753,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildUnidirectionalLSTMNet
input = output;
}

size_t idim = input->GetNumRows();
size_t idim = input->GetSampleMatrixNumRows();
assert(m_lookupTabelOrderSizes.size() == m_streamSizes.size());

e = builder.CreateLearnableParameter(msra::strfun::wstrprintf(L"Embedding%d", idx), m_layerSizes[1], idim / m_lookupTabelOrderSizes[idx]);
Expand Down Expand Up @@ -2069,7 +2069,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildBiDirectionalLSTMNetw
input = output;
}

size_t idim = input->GetNumRows();
size_t idim = input->GetSampleMatrixNumRows();
assert(m_lookupTabelOrderSizes.size() == m_streamSizes.size());

e = builder.CreateLearnableParameter(msra::strfun::wstrprintf(L"Embedding%d", idx), m_layerSizes[1], idim / m_lookupTabelOrderSizes[idx]);
Expand Down Expand Up @@ -2295,7 +2295,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildNetworkFromDbnFile(co
unsigned long randomSeed = 1;

ComputationNodePtr input, w, b, output, label, prior, scaledLogLikelihood;
shared_ptr<PreComputedNode<ElemType>> pcNodePtr;
shared_ptr<PreComputedNodeBase<ElemType>> pcNodePtr;

File fstream(dbnModelFileName, FileOptions::fileOptionsBinary | FileOptions::fileOptionsRead);

Expand Down Expand Up @@ -2354,11 +2354,11 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildNetworkFromDbnFile(co
contextStdDev.TransferFromDeviceToDevice(CPUDEVICE, m_deviceId, true, false, false);

w = builder.Mean(input, L"MeanOfFeatures");
static_pointer_cast<PreComputedNode<ElemType>>(w)->SideLoadFromMatrix(contextMean);
static_pointer_cast<PreComputedNodeBase<ElemType>>(w)->SideLoadFromMatrix(contextMean);
w->SetParameterUpdateRequired(false);

b = builder.InvStdDev(input, L"InvStdOfFeatures");
static_pointer_cast<PreComputedNode<ElemType>>(b)->SideLoadFromMatrix(contextStdDev);
static_pointer_cast<PreComputedNodeBase<ElemType>>(b)->SideLoadFromMatrix(contextStdDev);
b->SetParameterUpdateRequired(false);

output = builder.PerDimMeanVarNormalization(input, w, b, L"MVNormalizedFeatures");
Expand Down Expand Up @@ -2418,7 +2418,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildNetworkFromDbnFile(co
assert(priorVals.GetNumCols() == 1 && priorVals.GetNumRows() == m_outputLayerSize);

prior = builder.Mean(label, L"Prior");
static_pointer_cast<PreComputedNode<ElemType>>(prior)->SideLoadFromMatrix(priorVals);
static_pointer_cast<PreComputedNodeBase<ElemType>>(prior)->SideLoadFromMatrix(priorVals);
prior->SetParameterUpdateRequired(false);
}
else // pretrained network - need to add output layer, initalize
Expand All @@ -2431,7 +2431,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildNetworkFromDbnFile(co
else
std::runtime_error("Output layer size must be specified when converting pretrained network, use outputLayerSize=");

size_t penultimateSize = input->GetNumRows();
size_t penultimateSize = input->GetSampleMatrixNumRows();

wstring nameOfW = msra::strfun::wstrprintf(L"W%d", i);
wstring nameOfB = msra::strfun::wstrprintf(L"B%d", i);
Expand All @@ -2450,7 +2450,7 @@ ComputationNetworkPtr SimpleNetworkBuilder<ElemType>::BuildNetworkFromDbnFile(co
{
Matrix<ElemType> zeros = Matrix<ElemType>::Zeros(outputLayerSize, 1, m_deviceId);
prior = builder.Mean(label, L"Prior");
static_pointer_cast<PreComputedNode<ElemType>>(prior)->MarkComputed(false);
static_pointer_cast<PreComputedNodeBase<ElemType>>(prior)->MarkComputed(false);
prior->Value().SetValue(zeros);
}
}
Expand Down
8 changes: 4 additions & 4 deletions Source/CNTK/SynchronousExecutionEngine.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -313,7 +313,7 @@ void SynchronousNodeEvaluator<ElemType>::Evaluate(NDLNode<ElemType>* node, const
cnNodeType == OperationNameOf(FutureValueNode))
{
if (parameter.size() < 2 || parameter.size() > 3) // we allow 3 for legacy (cols parameter which is now unused)
RuntimeError("PastValue or FutureValue should have two to three fixed parameters. Usage: PastValue(rows, input, [timeStep=1, defaultPastValue=0.1]).");
RuntimeError("PastValue or FutureValue should have two to three fixed parameters. Usage: PastValue(rows, input, [timeStep=1, defaultHiddenActivity=0.1]).");
// TODO: allow a tensor descriptor. Or allow 0 (inference). Maybe already supported--check this.

nodeParamCount = 1; // number of inputs
Expand Down Expand Up @@ -346,7 +346,7 @@ void SynchronousNodeEvaluator<ElemType>::Evaluate(NDLNode<ElemType>* node, const
else if (cnNodeType == OperationNameOf(ConvolutionNode))
{
if (parameter.size() != 7)
RuntimeError("%ls should have 7 fixed parameters[weightNodeName, inputValueNodeName, kernelWidth, kernelHeight, outputChannels,horizontalSubsample, verticalSubsample] and two optional parameters [zeroPadding = [false|yourvalue], maxTempMemSizeInSamples = [0|yourvalue]].", cnNodeType.c_str());
RuntimeError("%ls should have 7 fixed parameters[weightNodeName, inputValueNodeName, kernelWidth, kernelHeight, outputChannels,horizontalSubsample, verticalSubsample] and two optional parameters [zeroPadding = [false|yourvalue], maxTempMemSizeInSamples = [0|yourvalue], imageLayout = \"HWC\"|\"cudnn\"].", cnNodeType.c_str());

// setup the parameter position of children so we can hook them up later
nodeParamCount = 2;
Expand Down Expand Up @@ -378,7 +378,7 @@ void SynchronousNodeEvaluator<ElemType>::Evaluate(NDLNode<ElemType>* node, const
else if (cnNodeType == OperationNameOf(MaxPoolingNode))
{
if (parameter.size() != 5)
RuntimeError("%ls should have 5 parameters[inputValueNodeName, windowWidth, windowHeight, horizontalSubsample, verticalSubsample].", cnNodeType.c_str());
RuntimeError("%ls should have 5 parameters[inputValueNodeName, windowWidth, windowHeight, horizontalSubsample, verticalSubsample, imageLayout = \"HWC\"|\"cudnn\"].", cnNodeType.c_str());

// setup the parameter position of children so we can hook them up later
nodeParamCount = 1;
Expand Down Expand Up @@ -406,7 +406,7 @@ void SynchronousNodeEvaluator<ElemType>::Evaluate(NDLNode<ElemType>* node, const
else if (cnNodeType == OperationNameOf(AveragePoolingNode))
{
if (parameter.size() != 5)
RuntimeError("%ls should have 5 parameters[inputValueNodeName, windowWidth, windowHeight, horizontalSubsample, verticalSubsample].", cnNodeType.c_str());
RuntimeError("%ls should have 5 parameters[inputValueNodeName, windowWidth, windowHeight, horizontalSubsample, verticalSubsample, imageLayout = \"HWC\"|\"cudnn\"].", cnNodeType.c_str());

// setup the parameter position of children so we can hook them up later
nodeParamCount = 1;
Expand Down
6 changes: 6 additions & 0 deletions Source/Common/Include/ProgressTracing.h
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,12 @@ namespace Microsoft { namespace MSR { namespace CNTK {
} // wrap static state in an accessor, so we won't need a CPP file

public:

static bool IsEnabled()
{
return GetStaticInstance().m_enabled;
}

// call TraceTotalNumberOfSteps() to set the total number of steps
// Calling this with totalNumberOfSteps>0 will enable progress tracing.
static void TraceTotalNumberOfSteps(size_t totalNumberOfSteps)
Expand Down
16 changes: 14 additions & 2 deletions Source/Common/Include/TensorShape.h
Original file line number Diff line number Diff line change
Expand Up @@ -383,12 +383,11 @@ struct TensorShape
{
return m_dims == other.m_dims;
}
bool operator!=(const TensorShape& other) const { return !operator==(other); } // duh!

// verify that this refers to a dense matrix (no strides)
void VerifyIsDense() const
{
if (m_offset != 0)
LogicError("TensorShape: A dense TensorShape expected. Offset %d not allowed.", (int) m_offset);
for (size_t k = 0; k < m_dims.size(); k++) // (TODO: we can save one multiplication here)
{
ptrdiff_t stride = k > 0 ? m_strides[k - 1] * (ptrdiff_t) m_dims[k - 1] : 1;
Expand Down Expand Up @@ -622,6 +621,19 @@ struct TensorShape
return *this;
}

// compare two TensorShapes, whether they are compatible, considering padding and broadcasting
bool IsElementwiseCompatibleWith(const TensorShape & other) const
{
for (size_t i = 0; i < m_dims.size(); i++)
{
size_t dim = m_dims[i];
size_t otherDim = i < other.size() ? other[i] : 1;
if (dim != otherDim && dim != 1 && otherDim != 1) // dims mismatch, and neither is broadcasting
return false;
}
return true;
}

// pretty-printing. Returns tensor dims in the form "I x J x K".
operator std::string() const
{
Expand Down
Loading

0 comments on commit 2374adc

Please sign in to comment.