Upload backup

master
王兵 5 months ago
parent bd63f12893
commit 78a8f56309

@@ -66,6 +66,29 @@
<version>1.9.3</version> <!-- please check for the latest version -->
</dependency>
<!-- Deeplearning4J core library (includes the Word2Vec implementation) -->
<dependency>
<groupId>org.deeplearning4j</groupId>
<artifactId>deeplearning4j-core</artifactId>
<version>1.0.0-M2.1</version>
</dependency>
<!-- ND4J numerical computing library, required by Deeplearning4J -->
<dependency>
<groupId>org.nd4j</groupId>
<artifactId>nd4j-native</artifactId>
<version>1.0.0-M2.1</version>
</dependency>
<dependency>
<groupId>org.nd4j</groupId>
<artifactId>nd4j-native-platform</artifactId>
<!-- aligned with the other ND4J/DL4J artifacts above; mixing 1.0.0-beta7 with 1.0.0-M2.1 leads to classpath conflicts -->
<version>1.0.0-M2.1</version>
</dependency>
<dependency>
<groupId>org.deeplearning4j</groupId>
<artifactId>arbiter-ui</artifactId>
<!-- note: arbiter-ui was last published as 1.0.0-beta7 and may not be fully compatible with the M2.1 artifacts -->
<version>1.0.0-beta7</version>
</dependency>
<!-- Logging framework -->
<dependency>
<groupId>ch.qos.logback</groupId>

@@ -0,0 +1,33 @@
package xyz.wbsite.ai;

import org.deeplearning4j.models.embeddings.loader.WordVectorSerializer;
import org.deeplearning4j.models.word2vec.Word2Vec;
import org.deeplearning4j.text.sentenceiterator.BasicLineIterator;
import org.deeplearning4j.text.sentenceiterator.SentenceIterator;
import org.deeplearning4j.text.tokenization.tokenizer.preprocessor.CommonPreprocessor;
import org.deeplearning4j.text.tokenization.tokenizerfactory.DefaultTokenizerFactory;
import org.deeplearning4j.text.tokenization.tokenizerfactory.TokenizerFactory;

import java.io.File;

public class Dl4j_Example {
    public static void main(String[] args) throws Exception {
        // Load the text data, one sentence per line
        String filePath = "path/to/your/text/file.txt";
        SentenceIterator iter = new BasicLineIterator(new File(filePath));

        // Define the tokenizer and normalize tokens (lowercase, strip punctuation)
        TokenizerFactory t = new DefaultTokenizerFactory();
        t.setTokenPreProcessor(new CommonPreprocessor());

        // Build the Word2Vec model
        Word2Vec vec = new Word2Vec.Builder()
            .minWordFrequency(5)
            .iterations(1)
            .layerSize(100)
            .seed(42)
            .windowSize(5)
            .iterate(iter)
            .tokenizerFactory(t)
            .build();

        // Train the model
        vec.fit();

        // Save the model
        WordVectorSerializer.writeWord2VecModel(vec, "path/to/save/your/model.bin");
    }
}
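
For reference, a model saved this way can be reloaded and queried without retraining. A minimal sketch, assuming the model path from the example above; the class name Dl4j_LoadExample and the tokens "day" and "night" are placeholders, and the tokens would have to exist in the trained vocabulary:

package xyz.wbsite.ai;

import org.deeplearning4j.models.embeddings.loader.WordVectorSerializer;
import org.deeplearning4j.models.word2vec.Word2Vec;

import java.io.File;
import java.util.Collection;

public class Dl4j_LoadExample {
    public static void main(String[] args) {
        // Reload the model written by Dl4j_Example (path is an assumption)
        Word2Vec vec = WordVectorSerializer.readWord2VecModel(new File("path/to/save/your/model.bin"));

        // Ten nearest neighbours of a vocabulary word by cosine similarity
        Collection<String> nearest = vec.wordsNearest("day", 10);
        System.out.println("Nearest to 'day': " + nearest);

        // Cosine similarity between two vocabulary words
        System.out.println("similarity(day, night) = " + vec.similarity("day", "night"));
    }
}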

@@ -0,0 +1,155 @@
package xyz.wbsite.ai;
import org.apache.commons.io.FilenameUtils;
import org.deeplearning4j.datasets.iterator.impl.MnistDataSetIterator;
import org.deeplearning4j.nn.conf.MultiLayerConfiguration;
import org.deeplearning4j.nn.conf.NeuralNetConfiguration;
import org.deeplearning4j.nn.conf.inputs.InputType;
import org.deeplearning4j.nn.conf.layers.*;
import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
import org.deeplearning4j.nn.weights.WeightInit;
import org.deeplearning4j.optimize.api.InvocationType;
import org.deeplearning4j.optimize.listeners.EvaluativeListener;
import org.deeplearning4j.optimize.listeners.ScoreIterationListener;
import org.nd4j.linalg.activations.Activation;
import org.nd4j.linalg.dataset.api.iterator.DataSetIterator;
import org.nd4j.linalg.learning.config.Adam;
import org.nd4j.linalg.lossfunctions.LossFunctions;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import java.io.File;
/* *****************************************************************************
*
* This program and the accompanying materials are made available under the
* terms of the Apache License, Version 2.0 which is available at
* https://www.apache.org/licenses/LICENSE-2.0.
* See the NOTICE file distributed with this work for additional
* information regarding copyright ownership.
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations
* under the License.
*
* SPDX-License-Identifier: Apache-2.0
******************************************************************************/
public class LeNetMNIST {
private static final Logger log = LoggerFactory.getLogger(LeNetMNIST.class);
public static void main(String[] args) throws Exception {
int nChannels = 1; // Number of input channels
int outputNum = 10; // The number of possible outcomes
int batchSize = 64; // Test batch size
int nEpochs = 1; // Number of training epochs
int seed = 123; // Random number generator seed
/*
* Create an iterator using the batch size for one iteration
*/
log.info("Load data....");
DataSetIterator mnistTrain = new MnistDataSetIterator(batchSize, true, 12345);
DataSetIterator mnistTest = new MnistDataSetIterator(batchSize, false, 12345);
/*
* Construct the neural network
*/
log.info("Build model....");
MultiLayerConfiguration conf = new NeuralNetConfiguration.Builder()
.seed(seed)
.l2(0.0005)
.weightInit(WeightInit.XAVIER)
.updater(new Adam(1e-3))
.list()
.layer(new ConvolutionLayer.Builder(5, 5)
//nIn and nOut specify depth. nIn here is the nChannels and nOut is the number of filters to be applied
.nIn(nChannels)
.stride(1, 1)
.nOut(20)
.activation(Activation.IDENTITY)
.build())
.layer(new SubsamplingLayer.Builder(PoolingType.MAX)
.kernelSize(2, 2)
.stride(2, 2)
.build())
.layer(new ConvolutionLayer.Builder(5, 5)
//Note that nIn need not be specified in later layers
.stride(1, 1)
.nOut(50)
.activation(Activation.IDENTITY)
.build())
.layer(new SubsamplingLayer.Builder(PoolingType.MAX)
.kernelSize(2, 2)
.stride(2, 2)
.build())
.layer(new DenseLayer.Builder().activation(Activation.RELU)
.nOut(500).build())
.layer(new OutputLayer.Builder(LossFunctions.LossFunction.NEGATIVELOGLIKELIHOOD)
.nOut(outputNum)
.activation(Activation.SOFTMAX)
.build())
.setInputType(InputType.convolutionalFlat(28, 28, 1)) //See note below
.build();
/*
* Regarding the .setInputType(InputType.convolutionalFlat(28,28,1)) line: This does a few things.
* (a) It adds preprocessors, which handle things like the transition between the convolutional/subsampling layers
* and the dense layer
* (b) Does some additional configuration validation
* (c) Where necessary, sets the nIn (number of input neurons, or input depth in the case of CNNs) values for each
* layer based on the size of the previous layer (but it won't override values manually set by the user)
* InputTypes can be used with other layer types too (RNNs, MLPs etc) not just CNNs.
* For normal images (when using ImageRecordReader) use InputType.convolutional(height,width,depth).
* MNIST record reader is a special case, that outputs 28x28 pixel grayscale (nChannels=1) images, in a "flattened"
* row vector format (i.e., 1x784 vectors), hence the "convolutionalFlat" input type used here.
*/
MultiLayerNetwork model = new MultiLayerNetwork(conf);
model.init();
log.info("Train model...");
model.setListeners(new ScoreIterationListener(10), new EvaluativeListener(mnistTest, 1, InvocationType.EPOCH_END)); //Print score every 10 iterations and evaluate on test set every epoch
model.fit(mnistTrain, nEpochs);
String path = FilenameUtils.concat(System.getProperty("java.io.tmpdir"), "lenetmnist.zip");
log.info("Saving model to tmp folder: " + path);
model.save(new File(path), true);
log.info("****************Example finished********************");
}
}
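
For reference, the network saved above can be restored from the tmp folder and re-evaluated without retraining. A minimal sketch; the class name LeNetMNIST_Load is an assumption, not part of this commit:

package xyz.wbsite.ai;

import org.apache.commons.io.FilenameUtils;
import org.deeplearning4j.datasets.iterator.impl.MnistDataSetIterator;
import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
import org.nd4j.evaluation.classification.Evaluation;
import org.nd4j.linalg.dataset.api.iterator.DataSetIterator;

import java.io.File;

public class LeNetMNIST_Load {
    public static void main(String[] args) throws Exception {
        // Same path LeNetMNIST used when saving
        String path = FilenameUtils.concat(System.getProperty("java.io.tmpdir"), "lenetmnist.zip");

        // true = also restore the updater state, matching model.save(file, true)
        MultiLayerNetwork model = MultiLayerNetwork.load(new File(path), true);

        // Evaluate on the MNIST test set, using the same batch size and seed as training
        DataSetIterator mnistTest = new MnistDataSetIterator(64, false, 12345);
        Evaluation eval = model.evaluate(mnistTest);
        System.out.println(eval.stats());
    }
}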

@@ -0,0 +1,35 @@
package xyz.wbsite.ai;
import org.deeplearning4j.models.embeddings.loader.WordVectorSerializer;
import org.deeplearning4j.models.word2vec.Word2Vec;
import org.deeplearning4j.text.sentenceiterator.LineSentenceIterator;
import org.deeplearning4j.text.sentenceiterator.SentenceIterator;
import java.io.File;
public class Word2Vec_Example {
public static void main(String[] args) {
try {
// Load the tokenized dataset produced by the crawler
String wordLib = "wordLib.lib";
String vecModel = "vecModel.model";
SentenceIterator iter = new LineSentenceIterator(new File(wordLib));
Word2Vec vec = new Word2Vec.Builder()
.minWordFrequency(5)
.iterations(1)
.layerSize(100)
.seed(42)
.windowSize(5)
.iterate(iter)
.build();
vec.fit();
// Delete any existing model file before saving
new File(vecModel).delete();
WordVectorSerializer.writeWordVectors(vec, vecModel);
} catch (Exception e) {
e.printStackTrace();
}
}
}
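
For reference, the text-format vectors written by writeWordVectors can be reloaded for raw vector lookups. A minimal sketch, assuming vecModel.model was produced by the example above; the class name Word2Vec_LoadExample and the token "example" are placeholders:

package xyz.wbsite.ai;

import org.deeplearning4j.models.embeddings.loader.WordVectorSerializer;
import org.deeplearning4j.models.word2vec.Word2Vec;

import java.util.Arrays;

public class Word2Vec_LoadExample {
    public static void main(String[] args) {
        // Reload the text-format model written by Word2Vec_Example
        Word2Vec vec = WordVectorSerializer.readWord2VecModel("vecModel.model");

        // "example" is a placeholder; substitute any token from the training corpus
        String token = "example";
        if (vec.hasWord(token)) {
            // Raw 100-dimensional embedding (layerSize from the builder above)
            double[] vector = vec.getWordVector(token);
            System.out.println(Arrays.toString(vector));
        } else {
            System.out.println("Token not in vocabulary: " + token);
        }
    }
}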