android - 在预览camerax android中获取所有文本框-6ren

android - 在预览camerax android中获取所有文本框

转载作者：行者123 更新时间：2023-12-05 00:02:39

我想分析我在预览相机中的框内的所有文本。但是我得到了错误的文本坐标。

验证在 contains 上完成

class TestsPhotoscan : AppCompatActivity() {
private lateinit var binding: ActivityMainBinding
private var scaleX = 1F
private var scaleY = 1F
private var rectCrop = Rect()
private var cameraProvider: ProcessCameraProvider? = null
private lateinit var cameraProviderListenableFuture: ListenableFuture<ProcessCameraProvider>

override fun onCreate(savedInstanceState: Bundle?) {
    super.onCreate(savedInstanceState)
    binding = ActivityMainBinding.inflate(layoutInflater)
    setContentView(binding.root)

    cameraProviderListenableFuture = ProcessCameraProvider.getInstance(this)

    // Request camera permissions
    if (allPermissionsGranted()) {
        startCamera()
    } else {
        ActivityCompat.requestPermissions(
            this,
            REQUIRED_PERMISSIONS,
            REQUEST_CODE_PERMISSIONS
        )
    }

    binding.borderView.viewTreeObserver.addOnGlobalLayoutListener(object :
        ViewTreeObserver.OnGlobalLayoutListener {
        override fun onGlobalLayout() {
            binding.borderView.viewTreeObserver.removeOnGlobalLayoutListener(this)
            val points = IntArray(2)
            binding.borderView.getLocationOnScreen(points)
            rectCrop = Rect(
                points[0],
                points[1],
                points[0] + binding.borderView.width,
                points[1] + binding.borderView.height
            )
        }
    })
}


private fun allPermissionsGranted() = REQUIRED_PERMISSIONS.all {
    ContextCompat.checkSelfPermission(
        this, it
    ) == PackageManager.PERMISSION_GRANTED
}

@SuppressLint("UnsafeExperimentalUsageError")
private fun startCamera() {

    cameraProviderListenableFuture.addListener(Runnable {
        cameraProvider = cameraProviderListenableFuture.get()
        binding.viewFinder.post { setupCamera() }
    }, ContextCompat.getMainExecutor(this))

}

private fun buildPreviewUseCase(): Preview {
    val display = binding.viewFinder.display
    val metrics = DisplayMetrics().also { display.getMetrics(it) }
    val preview = Preview.Builder()
        .setTargetRotation(display.rotation)
        .setTargetResolution(Size(metrics.widthPixels, metrics.heightPixels))
        .build()
        .apply {
            setSurfaceProvider(binding.viewFinder.surfaceProvider)
        }

    return preview
}

private fun setupCamera() {

    cameraProviderListenableFuture.addListener({

        // Preview
        val preview = buildPreviewUseCase()

        val imageAnalyzer = ImageAnalysis.Builder()
            .build()
            .also {
                it.setAnalyzer(ContextCompat.getMainExecutor(this),
                    { processImage(it) })
            }

        // Select back camera as a default
        val cameraSelector = CameraSelector.DEFAULT_BACK_CAMERA

        val useCaseGroup = UseCaseGroup.Builder()
            .addUseCase(preview)
            .addUseCase(imageAnalyzer)
            .build()

        try {
            // Unbind use cases before rebinding
            cameraProvider?.unbindAll()

            // Bind use cases to camera
            cameraProvider?.bindToLifecycle(
                this, cameraSelector, useCaseGroup
            )

        } catch (exc: Exception) {
            Log.e(TAG, "Use case binding failed", exc)
        }

    }, ContextCompat.getMainExecutor(this))
}

@SuppressLint("UnsafeOptInUsageError")
private fun processImage(imageProxy: ImageProxy) {

    setScaleFactor(imageProxy)
    recognizeText(
        InputImage. fromMediaImage(
            imageProxy.image!!,
            imageProxy.imageInfo.rotationDegrees
        )
    ).addOnCompleteListener { imageProxy.close() }
}

private fun setScaleFactor(imageProxy: ImageProxy) {
    val viewWidth = binding.viewFinder.width.toFloat()
    val viewHeight = binding.viewFinder.height.toFloat()
    val imageWidth = imageProxy.width.toFloat()
    val imageHeight = imageProxy.height

    scaleX = viewWidth / imageWidth
    scaleY = viewHeight / imageHeight
}

private fun recognizeText(image: InputImage): Task<Text> {

    val recognizer = TextRecognition.getClient(TextRecognizerOptions.DEFAULT_OPTIONS)

    return recognizer.process(image)
        .addOnSuccessListener(
            ScopedExecutor(TaskExecutors.MAIN_THREAD),
            OnSuccessListener<Text> {
                for (block in it.textBlocks) {
                    for (line in block.lines) {
                        for (element in line.elements) {
                            if (rectCrop.contains(
                                    translateX(element.boundingBox?.left ?: -1).roundToInt(),
                                    translateY(element.boundingBox?.top ?: -1).roundToInt()
                                )
                            ) {
                           
                            println(element.text)
                           }
                        }
                    }
                }
                
            })
}

override fun onRequestPermissionsResult(
    requestCode: Int,
    permissions: Array<out String>,
    grantResults: IntArray
) {
    super.onRequestPermissionsResult(requestCode, permissions, grantResults)
    if (requestCode == REQUEST_CODE_PERMISSIONS) {
        if (allPermissionsGranted()) {
            startCamera()
        } else {
            Toast.makeText(
                this,
                "Permissions not granted by the user.",
                Toast.LENGTH_SHORT
            ).show()
            // finish()
        }
        return
    }
}


companion object {
    private const val TAG = "Mytag"
    private const val REQUEST_CODE_PERMISSIONS = 10
    private val REQUIRED_PERMISSIONS = arrayOf(Manifest.permission.CAMERA)
}

fun translateX(x: Int) =
    x * scaleX

fun translateY(y: Int) = y * scaleY

}
和布局

<?xml version="1.0" encoding="utf-8"?>
<layout xmlns:app="http://schemas.android.com/apk/res-auto">
<androidx.constraintlayout.widget.ConstraintLayout                                          
xmlns:android="http://schemas.android.com/apk/res/android"
android:layout_width="match_parent"
android:id="@+id/root"
android:layout_height="match_parent">

<androidx.camera.view.PreviewView
    android:id="@+id/viewFinder"
    android:layout_width="0dp"
    android:layout_height="0dp"
    app:layout_constraintBottom_toBottomOf="parent"
    app:layout_constraintEnd_toEndOf="parent"
    app:layout_constraintStart_toStartOf="parent"
    app:layout_constraintTop_toTopOf="parent" />

<View
    android:id="@+id/border_view"
    android:layout_width="match_parent"
    android:layout_height="250dp"
    android:layout_margin="16dp"
    android:background="@drawable/background_drawable"
    app:layout_constraintBottom_toBottomOf="@+id/viewFinder"
    app:layout_constraintEnd_toEndOf="parent"
    app:layout_constraintStart_toStartOf="parent"
    app:layout_constraintTop_toTopOf="parent" />

   </androidx.constraintlayout.widget.ConstraintLayout>
   </layout>

最佳答案

您遇到的困难是获得从 ImageProxy 中的图像到 PreviewView 显示的图像的良好映射。虽然这听起来很容易，但我不相信有直接的方法来进行这种映射。见answer到一个类似的问题。我查看了实现此答案中的每个建议，尽管它们在某些情况下有效，但在其他情况下却失败了。当然，我可能采取了错误的方法。
我得出的结论是，提取和分析从预览区域提取的位图并识别那些完全被红色矩形包围的单词是最简单的。我用它们自己的红色矩形框住这些词，以表明它们已被正确识别。

以下是重新设计的 Activity ，一个图形叠加层生成了用于显示的单词框和 XML。注释在代码中。祝你好运!
TestPhotoscan.kt

class TestsPhotoscan : AppCompatActivity() {
    private lateinit var binding: ActivityMainBinding
    private var wordFenceRect = Rect()
    private var cameraProvider: ProcessCameraProvider? = null
    private lateinit var cameraProviderListenableFuture: ListenableFuture<ProcessCameraProvider>

    override fun onCreate(savedInstanceState: Bundle?) {
        super.onCreate(savedInstanceState)
        binding = ActivityMainBinding.inflate(layoutInflater)
        setContentView(binding.root)

        cameraProviderListenableFuture = ProcessCameraProvider.getInstance(this)

        // Request camera permissions
        if (allPermissionsGranted()) {
            startCamera()
        } else {
            ActivityCompat.requestPermissions(
                this,
                REQUIRED_PERMISSIONS,
                REQUEST_CODE_PERMISSIONS
            )
        }
    }

    private fun allPermissionsGranted() = REQUIRED_PERMISSIONS.all {
        ContextCompat.checkSelfPermission(
            this, it
        ) == PackageManager.PERMISSION_GRANTED
    }

    @SuppressLint("UnsafeExperimentalUsageError")
    private fun startCamera() {
        cameraProviderListenableFuture.addListener({
            cameraProvider = cameraProviderListenableFuture.get()
            binding.viewFinder.post { setupCamera() }
        }, ContextCompat.getMainExecutor(this))
    }

    private fun buildPreviewUseCase(): Preview {
        val display = binding.viewFinder.display
        val metrics = DisplayMetrics().also { display.getRealMetrics(it) }
        val rotation = display.rotation

        return Preview.Builder()
            .setTargetResolution(Size(metrics.widthPixels, metrics.heightPixels))
            .setTargetRotation(rotation)
            .build()
            .apply {
                setSurfaceProvider(binding.viewFinder.surfaceProvider)
            }
    }

    @SuppressLint("UnsafeOptInUsageError")
    private fun setupCamera() {
        cameraProviderListenableFuture.addListener({

            // Preview
            val preview = buildPreviewUseCase()

            val imageAnalyzer = ImageAnalysis.Builder()
                .build()
                .also { it ->
                    it.setAnalyzer(ContextCompat.getMainExecutor(this),
                        { processImage(it) })
                }

            // Select back camera as a default
            val cameraSelector = CameraSelector.DEFAULT_BACK_CAMERA

            val useCaseGroup = UseCaseGroup.Builder()
                .addUseCase(preview)
                .addUseCase(imageAnalyzer)
                .build()

            try {
                // Unbind use cases before rebinding
                cameraProvider?.unbindAll()

                // Bind use cases to camera
                cameraProvider?.bindToLifecycle(
                    this, cameraSelector, useCaseGroup
                )

            } catch (exc: Exception) {
                Log.e(TAG, "Use case binding failed", exc)
            }

        }, ContextCompat.getMainExecutor(this))
    }

    @SuppressLint("UnsafeOptInUsageError")
    private fun processImage(imageProxy: ImageProxy) {
        // This code will display the image available in the ImageProxy within an inset view
        // if the inset view is visible to the user.
        //
        // The source for ImageUtils is at
        // https://github.com/googlesamples/mlkit/blob/master/android/translate-showcase/app/src/main/java/com/google/mlkit/showcase/translate/util/ImageUtils.kt
        if (binding.insetView.visibility == View.VISIBLE) {
            var imageBitmap = ImageUtils.convertYuv420888ImageToBitmap(imageProxy.image!!)
            imageBitmap = rotateBitmap(imageBitmap, imageProxy.imageInfo.rotationDegrees.toFloat())
            binding.insetView.setImageBitmap(imageBitmap)
        }

        // PreviewViews allow access to a bitmap representation of what the preview shows. This is
        // just a whole lot easier than mapping the ImageProxy image to what the PreviewView
        // displays on the screen.  See https://stackoverflow.com/a/63912198/6287910
        binding.viewFinder.bitmap?.apply {
            recognizeText(
                InputImage.fromBitmap(this, 0)
            ).addOnCompleteListener { imageProxy.close() }
        }
    }

    private fun recognizeText(image: InputImage): Task<Text> {
        val recognizer = TextRecognition.getClient(TextRecognizerOptions.DEFAULT_OPTIONS)

        return recognizer.process(image)
            .addOnSuccessListener(
                ScopedExecutor(TaskExecutors.MAIN_THREAD),
                {
                    binding.wordFence.clearBoxes()
                    binding.wordFence.getHitRect(wordFenceRect)
                    for (block in it.textBlocks) {
                        for (line in block.lines) {
                            for (element in line.elements) {
                                // For each word, check to make sure that the entire word is
                                // contained with the word fence.
                                if (isRectWithinRect(element.boundingBox, wordFenceRect)) {
                                    // Change the box boundary from the coordinate system of the
                                    // parent to the coordinates of the word fence.
                                    val outlineBox = Rect(element.boundingBox)
                                    outlineBox.offset(
                                        -binding.wordFence.left,
                                        -binding.wordFence.top
                                    )
                                    binding.wordFence.addBox(outlineBox)
                                }
                            }
                        }
                    }
                    binding.wordFence.invalidate()
                })
    }

    override fun onRequestPermissionsResult(
        requestCode: Int,
        permissions: Array<out String>,
        grantResults: IntArray
    ) {
        super.onRequestPermissionsResult(requestCode, permissions, grantResults)
        if (requestCode == REQUEST_CODE_PERMISSIONS) {
            if (allPermissionsGranted()) {
                startCamera()
            } else {
                Toast.makeText(
                    this,
                    "Permissions not granted by the user.",
                    Toast.LENGTH_SHORT
                ).show()
                // finish()
            }
            return
        }
    }

    private fun isRectWithinRect(enclosedRect: Rect?, enclosingRect: Rect) =
        enclosedRect != null && enclosingRect.contains(enclosedRect)

    private fun rotateBitmap(bitmap: Bitmap, rotation: Float) =
        Matrix().run {
            preRotate(rotation)
            Bitmap.createBitmap(
                bitmap, 0, 0, bitmap.width, bitmap.height, this, true
            )
        }

    companion object {
        private const val TAG = "Applog"
        private const val REQUEST_CODE_PERMISSIONS = 10
        private val REQUIRED_PERMISSIONS = arrayOf(Manifest.permission.CAMERA)
    }
}

BoxedWordView.kt

class BoxedWordView @JvmOverloads constructor(
    context: Context, attrs: AttributeSet? = null, defStyleAttr: Int = 0
) : View(context, attrs, defStyleAttr) {

    private val mBoxes = mutableListOf<Rect>()
    private val mPaint = Paint().apply {
        strokeWidth = 2f
        color = context.resources.getColor(android.R.color.holo_red_light)
        style = Paint.Style.STROKE
    }

    override fun onDrawForeground(canvas: Canvas) {
        super.onDrawForeground(canvas)
        for (box in mBoxes) {
            drawBox(canvas, box)
        }
    }

    private fun drawBox(canvas: Canvas, box: Rect) {
        canvas.drawRect(box, mPaint)
    }

    fun addBox(box: Rect) {
        mBoxes.add(box)
    }

    fun clearBoxes() {
        mBoxes.clear()
    }
}

activity_main.xml

<layout>

    <androidx.constraintlayout.widget.ConstraintLayout
        android:id="@+id/root"
        android:layout_width="match_parent"
        android:layout_height="match_parent"
        android:background="@android:color/darker_gray">

        <androidx.camera.view.PreviewView
            android:id="@+id/viewFinder"
            android:layout_width="0dp"
            android:layout_height="0dp"
            app:layout_constraintBottom_toBottomOf="parent"
            app:layout_constraintEnd_toEndOf="parent"
            app:layout_constraintStart_toStartOf="parent"
            app:layout_constraintTop_toTopOf="parent" />

        <ImageView
            android:id="@+id/insetView"
            android:layout_width="wrap_content"
            android:layout_height="wrap_content"
            android:visibility="invisible"
            app:layout_constraintBottom_toBottomOf="parent"
            app:layout_constraintStart_toStartOf="parent"
            tools:srcCompat="@tools:sample/backgrounds/scenic" />

        <com.example.textrecognition.BoxedWordView
            android:id="@+id/wordFence"
            android:layout_width="0dp"
            android:layout_height="250dp"
            android:layout_margin="16dp"
            android:background="@drawable/background_drawable"
            app:layout_constraintBottom_toBottomOf="@+id/viewFinder"
            app:layout_constraintEnd_toEndOf="@id/viewFinder"
            app:layout_constraintStart_toStartOf="@id/viewFinder"
            app:layout_constraintTop_toTopOf="@id/viewFinder" />
    </androidx.constraintlayout.widget.ConstraintLayout>
</layout>

我会提到，从“最近”列表返回时，该应用程序有时会卡住。我可能已经介绍了这个问题，但请注意它。

关于android - 在预览camerax android中获取所有文本框，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/68730714/

文章推荐： java - 如何使用android中的回收器 View 将事件放入日历中

文章推荐： SQL代码更新表

文章推荐： java - FragmentDirections 生成成功但无法解析符号

javascript - 将数据从应用程序组件[文本框]传递到网站组件[文本框]
我正在为一个网站开发应用程序(我无法访问该网站)。所以我想做以下事情: 那么如何将文本数据从 Android View 传递到网页中的文本框并捕获来自网站的响应？我试图记住这一切我无法访问任何网站
Silverlight 文本框
我有一个文本框，里面有一个很长的 url。我想做的是，当用户点击主页按钮时，我希望光标移动到文本框的开头。我希望这是正常行为，但事实并非如此，当文本框内的文本很长时，我点击回家，它会转到文本框中当前
带有图像的 WPF 文本框
我正在做一个WPF登录界面。在我的登录面板中，我有一个登录 TextBox和 PasswordBox .如下图第一张所示，登录文本框中有一个小人类标志，密码框中有一个锁。我将图像设置为文本框背景，然后
wpf - 文本框 - 水平文本居中
是否有任何简单的方法可以使文本在文本框中居中？我正在寻找一些内置函数，但什么也没找到。最佳答案将 TextAlignment 属性设置为 Center: 关于wpf - 文本框 - 水平文本居中
Powershell 文本框 SecureString
是否可以使用 System.Windows.Forms.TextBox(或任何其他方法)输入可随后转换为安全字符串的文本？我希望能够获取输入的值，将其转换为安全字符串并将其写入一个文件，然后可以在需要
Powershell 文本框 SecureString
是否可以使用 System.Windows.Forms.TextBox(或任何其他方法)输入可随后转换为安全字符串的文本？我希望能够获取输入的值，将其转换为安全字符串并将其写入一个文件，然后可以在需要
java - Android 文本框
我想将纬度和经度的值返回到我的 EditText 中，我已经能够使用 Toast 来做到这一点，但没有通过实现它>编辑文本。请帮忙 // EditText latEditText =
Jquery Iframe 文本框
我是Jquery新手，其实我对JQuery的使用知识是0。我正在尝试使用 JQuery 来实现某些功能。我有一个带有 iframe 的 html 页面。 iframe 页面中有一个表单和一个文本框。
c# - 在动态创建的事件处理程序中访问动态创建的控件(文本框)
我正在尝试在 Button 的事件处理程序中访问我在 C# 中动态创建的 TextBox。 void MainFormLoad(object sender, EventArgs e)
javascript - 文本框 -> 立即开始输入而不是单击文本框
我有一个搜索栏，当我打开搜索栏时，我想立即开始输入，不想点击文本框。我尝试使用 myTextBoxId.click()(因为当您单击它时，您可以开始输入)但它不起作用。最佳答案你必须 docum
Javascript 文本框 "Scrubber"
我还没有找到好的解决方案:我有一个文本框，用户需要能够在其中输入特定信息。例如，命令可能是“9030 OUT FU [1234 TEST]”。我需要“擦洗”这个文本框以确保数据是以这种格式输入的(不
Java 文本框 - 将字节转换为字符串
我有一个 Java 应用程序，您可以在其中将字符串输入文本框，点击加密，它会在单独的文本框中显示加密的字符串。我将为此使用 AES 加密。问题是我无法让加密文本按字节显示，但文本框不会显示字节(仅采用
html - 文本框，将文本带到文本框中的下一行
我已经浏览了您庞大的问题数据库，但似乎没有找到答案。我在将文本换行时遇到问题 - 即使之前的行上仍有空间。这是代码: p1 { border-left: 6px solid blue; bac
javascript - 如何触发按钮打开用户输入/文本框
所以我正在尝试创建“看板/待办事项列表”网站，但我在触发添加按钮时遇到了问题。我试图触发“添加”按钮以打开用户输入框。所以我有这个创建一个小框的“添加”按钮。但我无法弄清楚如何在该框中添加一个小区域，
javascript - JavaScript 文本框
我有一个文本框，应该只接受浮点值。它不应该允许任何其他值。怎么做。我在 HTML 中完成了此操作。 Weight 但是，它不起作用？如何做到这一点。最佳答案 // remo
javascript - 文本框 - 如何不显示已填充的值
当用户点击文本框时，如何不显示出现在文本框下方的已填充值最佳答案将这个属性放在你的文本框中 autocomplete="off" 关于javascript - 文本框 - 如何不显示已填充的值，我
javascript - flex 文本框
JavaScript: function resize(elem){ if(!elem.value.length) elem.size=1; else elem.size=elem.value
带有两个按钮的 HTML 文本框
在我的代码下面，我需要它具有相同的宽度和高度，但有多行“从第一行开始”，当到达行尾时转到新行，只有 120 个字符，就像我用“Enter短信”当您向右单击时隐藏，但我需要它为灰色。最佳答案您可以使
C#、文本框、.NET
我有一个问题，我必须创建一种方法来搜索显示在多个文本框 (lblResult.Text) 中的选定文本文件的内容。使用简单的搜索算法:搜索用户输入的整个搜索词。例如，如果用户输入“hello”，则只搜
c# - 文本框.SelectionStart
我正在尝试对文本框使用 SelectionStart 和 SelectionLength 属性。它没有效果，但也没有错误。它实际上是后台工作程序 ProgressChanged 方法的一部分，但我已经

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

android - 在预览camerax android中获取所有文本框